diff --git "a/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" "b/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" --- "a/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" +++ "b/wandb/run-20220504_142129-1tmxz74i/files/wandb-summary.json" @@ -1 +1 @@ -{"train/loss": 3.8403, "train/learning_rate": 0.000204047622251611, "train/epoch": 1.23, "train/global_step": 4000, "_runtime": 37359, "_timestamp": 1651711448, "_step": 4007, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 8.0, 21.0, 61.0, 203.0, 302.0, 217.0, 121.0, 53.0, 19.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.325448513031006, -6.183903694152832, -6.042358875274658, -5.900814056396484, -5.759269714355469, -5.617724895477295, -5.476180076599121, -5.334635257720947, -5.193090438842773, -5.0515456199646, -4.910000801086426, -4.76845645904541, -4.626911640167236, -4.4853668212890625, -4.343822002410889, -4.202277183532715, -4.060732841491699, -3.9191880226135254, -3.7776434421539307, -3.636098623275757, -3.494553804397583, -3.3530092239379883, -3.2114644050598145, -3.0699195861816406, -2.928374767303467, -2.786829948425293, -2.6452853679656982, -2.5037405490875244, -2.3621957302093506, -2.220651149749756, -2.079106330871582, -1.9375615119934082, -1.7960166931152344, -1.65447199344635, -1.5129271745681763, -1.371382474899292, -1.2298376560211182, -1.0882929563522339, -0.9467482566833496, -0.8052034974098206, -0.6636587381362915, -0.5221139788627625, -0.3805692493915558, -0.23902451992034912, -0.09747976064682007, 0.044064998626708984, 0.18560969829559326, 0.3271544575691223, 0.46869921684265137, 0.6102439761161804, 0.7517887353897095, 0.8933334350585938, 1.0348782539367676, 1.1764229536056519, 1.3179676532745361, 1.45951247215271, 1.6010571718215942, 1.7426018714904785, 1.8841466903686523, 2.025691509246826, 2.167236089706421, 2.3087809085845947, 2.4503254890441895, 2.5918703079223633, 2.733415126800537]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 7.0, 7.0, 14.0, 8.0, 17.0, 15.0, 16.0, 21.0, 25.0, 17.0, 39.0, 30.0, 33.0, 35.0, 27.0, 50.0, 36.0, 42.0, 48.0, 39.0, 27.0, 48.0, 40.0, 31.0, 34.0, 37.0, 27.0, 33.0, 36.0, 26.0, 23.0, 19.0, 21.0, 21.0, 6.0, 8.0, 7.0, 7.0, 8.0, 9.0, 2.0, 4.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.8047726154327393, -2.7282562255859375, -2.6517398357391357, -2.575223445892334, -2.4987070560455322, -2.4221906661987305, -2.3456742763519287, -2.269157886505127, -2.192641258239746, -2.1161248683929443, -2.0396084785461426, -1.9630920886993408, -1.886575698852539, -1.8100593090057373, -1.733542799949646, -1.6570264101028442, -1.580510139465332, -1.5039937496185303, -1.4274773597717285, -1.3509609699249268, -1.274444580078125, -1.1979281902313232, -1.121411681175232, -1.0448952913284302, -0.9683789014816284, -0.8918625116348267, -0.8153461217880249, -0.7388296723365784, -0.6623132824897766, -0.5857968926429749, -0.5092804431915283, -0.43276405334472656, -0.3562474250793457, -0.27973103523254395, -0.2032146155834198, -0.12669821083545685, -0.050181806087493896, 0.02633458375930786, 0.102851003408432, 0.17936742305755615, 0.2558838129043579, 0.33240020275115967, 0.4089166224002838, 0.48543304204940796, 0.5619494318962097, 0.6384658217430115, 0.714982271194458, 0.7914986610412598, 0.8680150508880615, 0.9445314407348633, 1.021047830581665, 1.0975642204284668, 1.1740806102752686, 1.2505970001220703, 1.3271135091781616, 1.4036298990249634, 1.4801462888717651, 1.556662678718567, 1.6331790685653687, 1.7096954584121704, 1.7862119674682617, 1.8627283573150635, 1.9392447471618652, 2.015761137008667, 2.0922775268554688]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 6.0, 3.0, 8.0, 12.0, 19.0, 18.0, 28.0, 49.0, 57.0, 104.0, 116.0, 211.0, 314.0, 483.0, 911.0, 1667.0, 3024.0, 5978.0, 12179.0, 26297.0, 55289.0, 127044.0, 483441.0, 2848862.0, 412862.0, 115660.0, 51402.0, 24359.0, 11554.0, 5683.0, 2911.0, 1501.0, 894.0, 460.0, 280.0, 207.0, 137.0, 86.0, 62.0, 27.0, 17.0, 19.0, 14.0, 9.0, 6.0, 7.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.814453125, -1.760223388671875, -1.70599365234375, -1.651763916015625, -1.5975341796875, -1.543304443359375, -1.48907470703125, -1.434844970703125, -1.380615234375, -1.326385498046875, -1.27215576171875, -1.217926025390625, -1.1636962890625, -1.109466552734375, -1.05523681640625, -1.001007080078125, -0.94677734375, -0.892547607421875, -0.83831787109375, -0.784088134765625, -0.7298583984375, -0.675628662109375, -0.62139892578125, -0.567169189453125, -0.512939453125, -0.458709716796875, -0.40447998046875, -0.350250244140625, -0.2960205078125, -0.241790771484375, -0.18756103515625, -0.133331298828125, -0.0791015625, -0.024871826171875, 0.02935791015625, 0.083587646484375, 0.1378173828125, 0.192047119140625, 0.24627685546875, 0.300506591796875, 0.354736328125, 0.408966064453125, 0.46319580078125, 0.517425537109375, 0.5716552734375, 0.625885009765625, 0.68011474609375, 0.734344482421875, 0.78857421875, 0.842803955078125, 0.89703369140625, 0.951263427734375, 1.0054931640625, 1.059722900390625, 1.11395263671875, 1.168182373046875, 1.222412109375, 1.276641845703125, 1.33087158203125, 1.385101318359375, 1.4393310546875, 1.493560791015625, 1.54779052734375, 1.602020263671875, 1.65625]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 9.0, 9.0, 3.0, 4.0, 8.0, 7.0, 11.0, 16.0, 16.0, 19.0, 15.0, 22.0, 21.0, 33.0, 24.0, 35.0, 38.0, 47.0, 34.0, 34.0, 50.0, 46.0, 35.0, 36.0, 34.0, 35.0, 40.0, 28.0, 33.0, 40.0, 33.0, 25.0, 31.0, 18.0, 26.0, 11.0, 12.0, 16.0, 8.0, 11.0, 12.0, 7.0, 2.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.3046875, -2.235565185546875, -2.16644287109375, -2.097320556640625, -2.0281982421875, -1.959075927734375, -1.88995361328125, -1.820831298828125, -1.751708984375, -1.682586669921875, -1.61346435546875, -1.544342041015625, -1.4752197265625, -1.406097412109375, -1.33697509765625, -1.267852783203125, -1.19873046875, -1.129608154296875, -1.06048583984375, -0.991363525390625, -0.9222412109375, -0.853118896484375, -0.78399658203125, -0.714874267578125, -0.645751953125, -0.576629638671875, -0.50750732421875, -0.438385009765625, -0.3692626953125, -0.300140380859375, -0.23101806640625, -0.161895751953125, -0.0927734375, -0.023651123046875, 0.04547119140625, 0.114593505859375, 0.1837158203125, 0.252838134765625, 0.32196044921875, 0.391082763671875, 0.460205078125, 0.529327392578125, 0.59844970703125, 0.667572021484375, 0.7366943359375, 0.805816650390625, 0.87493896484375, 0.944061279296875, 1.01318359375, 1.082305908203125, 1.15142822265625, 1.220550537109375, 1.2896728515625, 1.358795166015625, 1.42791748046875, 1.497039794921875, 1.566162109375, 1.635284423828125, 1.70440673828125, 1.773529052734375, 1.8426513671875, 1.911773681640625, 1.98089599609375, 2.050018310546875, 2.119140625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 5.0, 10.0, 12.0, 21.0, 15.0, 16.0, 26.0, 40.0, 57.0, 85.0, 171.0, 761.0, 4189463.0, 3000.0, 230.0, 95.0, 73.0, 40.0, 43.0, 22.0, 23.0, 16.0, 11.0, 6.0, 5.0, 9.0, 5.0, 3.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-54.0, -52.396484375, -50.79296875, -49.189453125, -47.5859375, -45.982421875, -44.37890625, -42.775390625, -41.171875, -39.568359375, -37.96484375, -36.361328125, -34.7578125, -33.154296875, -31.55078125, -29.947265625, -28.34375, -26.740234375, -25.13671875, -23.533203125, -21.9296875, -20.326171875, -18.72265625, -17.119140625, -15.515625, -13.912109375, -12.30859375, -10.705078125, -9.1015625, -7.498046875, -5.89453125, -4.291015625, -2.6875, -1.083984375, 0.51953125, 2.123046875, 3.7265625, 5.330078125, 6.93359375, 8.537109375, 10.140625, 11.744140625, 13.34765625, 14.951171875, 16.5546875, 18.158203125, 19.76171875, 21.365234375, 22.96875, 24.572265625, 26.17578125, 27.779296875, 29.3828125, 30.986328125, 32.58984375, 34.193359375, 35.796875, 37.400390625, 39.00390625, 40.607421875, 42.2109375, 43.814453125, 45.41796875, 47.021484375, 48.625]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 7.0, 6.0, 14.0, 17.0, 24.0, 15.0, 29.0, 30.0, 47.0, 88.0, 134.0, 295.0, 1525.0, 1216.0, 225.0, 104.0, 68.0, 43.0, 39.0, 31.0, 23.0, 24.0, 13.0, 6.0, 11.0, 11.0, 1.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.041015625, -1.0093612670898438, -0.9777069091796875, -0.9460525512695312, -0.914398193359375, -0.8827438354492188, -0.8510894775390625, -0.8194351196289062, -0.78778076171875, -0.7561264038085938, -0.7244720458984375, -0.6928176879882812, -0.661163330078125, -0.6295089721679688, -0.5978546142578125, -0.5662002563476562, -0.5345458984375, -0.5028915405273438, -0.4712371826171875, -0.43958282470703125, -0.407928466796875, -0.37627410888671875, -0.3446197509765625, -0.31296539306640625, -0.28131103515625, -0.24965667724609375, -0.2180023193359375, -0.18634796142578125, -0.154693603515625, -0.12303924560546875, -0.0913848876953125, -0.05973052978515625, -0.028076171875, 0.00357818603515625, 0.0352325439453125, 0.06688690185546875, 0.098541259765625, 0.13019561767578125, 0.1618499755859375, 0.19350433349609375, 0.22515869140625, 0.25681304931640625, 0.2884674072265625, 0.32012176513671875, 0.351776123046875, 0.38343048095703125, 0.4150848388671875, 0.44673919677734375, 0.4783935546875, 0.5100479125976562, 0.5417022705078125, 0.5733566284179688, 0.605010986328125, 0.6366653442382812, 0.6683197021484375, 0.6999740600585938, 0.73162841796875, 0.7632827758789062, 0.7949371337890625, 0.8265914916992188, 0.858245849609375, 0.8899002075195312, 0.9215545654296875, 0.9532089233398438, 0.98486328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 11.0, 14.0, 23.0, 40.0, 58.0, 101.0, 151.0, 150.0, 138.0, 119.0, 68.0, 49.0, 34.0, 14.0, 9.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.2154412269592285, -6.0589518547058105, -5.902462005615234, -5.745972633361816, -5.589483261108398, -5.4329938888549805, -5.276504039764404, -5.120014667510986, -4.963525295257568, -4.80703592300415, -4.650546073913574, -4.494056701660156, -4.337567329406738, -4.18107795715332, -4.024588108062744, -3.868098735809326, -3.711609125137329, -3.555119514465332, -3.398630142211914, -3.242140531539917, -3.085651159286499, -2.929161548614502, -2.772672176361084, -2.616182565689087, -2.45969295501709, -2.3032033443450928, -2.146713972091675, -1.9902243614196777, -1.8337349891662598, -1.6772453784942627, -1.5207558870315552, -1.3642663955688477, -1.2077770233154297, -1.0512875318527222, -0.8947980403900146, -0.7383084893226624, -0.5818189978599548, -0.4253295063972473, -0.268839955329895, -0.1123504638671875, 0.04413902759552002, 0.20062853395938873, 0.35711804032325745, 0.5136075615882874, 0.6700970530509949, 0.8265865445137024, 0.9830760955810547, 1.1395655870437622, 1.2960550785064697, 1.4525445699691772, 1.6090340614318848, 1.7655236721038818, 1.9220130443572998, 2.078502655029297, 2.234992027282715, 2.391481637954712, 2.547971248626709, 2.704460859298706, 2.860950231552124, 3.017439842224121, 3.173929214477539, 3.330418825149536, 3.486908435821533, 3.643397808074951, 3.799887180328369]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 7.0, 6.0, 8.0, 13.0, 6.0, 19.0, 17.0, 22.0, 22.0, 23.0, 26.0, 33.0, 35.0, 40.0, 45.0, 46.0, 48.0, 30.0, 44.0, 44.0, 42.0, 40.0, 54.0, 52.0, 31.0, 32.0, 34.0, 42.0, 25.0, 21.0, 24.0, 17.0, 14.0, 12.0, 9.0, 10.0, 0.0, 3.0, 3.0, 6.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.6971004009246826, -2.620529890060425, -2.543959379196167, -2.467388868331909, -2.3908183574676514, -2.3142478466033936, -2.2376773357391357, -2.161106824874878, -2.08453631401062, -2.0079658031463623, -1.9313952922821045, -1.8548247814178467, -1.7782542705535889, -1.701683759689331, -1.6251132488250732, -1.5485427379608154, -1.4719722270965576, -1.3954017162322998, -1.318831205368042, -1.2422606945037842, -1.1656901836395264, -1.0891196727752686, -1.0125491619110107, -0.9359786510467529, -0.8594081401824951, -0.7828376293182373, -0.7062671184539795, -0.6296966075897217, -0.5531260967254639, -0.47655558586120605, -0.39998507499694824, -0.32341456413269043, -0.24684429168701172, -0.1702737808227539, -0.0937032699584961, -0.01713275909423828, 0.05943775177001953, 0.13600826263427734, 0.21257877349853516, 0.28914928436279297, 0.3657197952270508, 0.4422903060913086, 0.5188608169555664, 0.5954313278198242, 0.672001838684082, 0.7485723495483398, 0.8251428604125977, 0.9017133712768555, 0.9782838821411133, 1.054854393005371, 1.131424903869629, 1.2079954147338867, 1.2845659255981445, 1.3611364364624023, 1.4377069473266602, 1.514277458190918, 1.5908479690551758, 1.6674184799194336, 1.7439889907836914, 1.8205595016479492, 1.897130012512207, 1.9737005233764648, 2.0502710342407227, 2.1268415451049805, 2.2034120559692383]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 8.0, 10.0, 17.0, 19.0, 34.0, 32.0, 48.0, 63.0, 66.0, 123.0, 157.0, 205.0, 282.0, 442.0, 614.0, 1158.0, 2713.0, 8135.0, 33120.0, 168884.0, 568355.0, 208175.0, 39783.0, 9574.0, 2968.0, 1333.0, 623.0, 437.0, 307.0, 219.0, 150.0, 132.0, 83.0, 72.0, 51.0, 36.0, 25.0, 16.0, 12.0, 12.0, 13.0, 8.0, 9.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.3837890625, -0.3712310791015625, -0.358673095703125, -0.3461151123046875, -0.33355712890625, -0.3209991455078125, -0.308441162109375, -0.2958831787109375, -0.2833251953125, -0.2707672119140625, -0.258209228515625, -0.2456512451171875, -0.23309326171875, -0.2205352783203125, -0.207977294921875, -0.1954193115234375, -0.182861328125, -0.1703033447265625, -0.157745361328125, -0.1451873779296875, -0.13262939453125, -0.1200714111328125, -0.107513427734375, -0.0949554443359375, -0.0823974609375, -0.0698394775390625, -0.057281494140625, -0.0447235107421875, -0.03216552734375, -0.0196075439453125, -0.007049560546875, 0.0055084228515625, 0.01806640625, 0.0306243896484375, 0.043182373046875, 0.0557403564453125, 0.06829833984375, 0.0808563232421875, 0.093414306640625, 0.1059722900390625, 0.1185302734375, 0.1310882568359375, 0.143646240234375, 0.1562042236328125, 0.16876220703125, 0.1813201904296875, 0.193878173828125, 0.2064361572265625, 0.218994140625, 0.2315521240234375, 0.244110107421875, 0.2566680908203125, 0.26922607421875, 0.2817840576171875, 0.294342041015625, 0.3069000244140625, 0.3194580078125, 0.3320159912109375, 0.344573974609375, 0.3571319580078125, 0.36968994140625, 0.3822479248046875, 0.394805908203125, 0.4073638916015625, 0.419921875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 6.0, 6.0, 5.0, 12.0, 19.0, 12.0, 23.0, 29.0, 16.0, 21.0, 26.0, 29.0, 28.0, 32.0, 34.0, 40.0, 41.0, 52.0, 39.0, 52.0, 43.0, 31.0, 44.0, 49.0, 41.0, 34.0, 35.0, 27.0, 35.0, 13.0, 21.0, 12.0, 19.0, 19.0, 11.0, 9.0, 13.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0], "bins": [-1.9296875, -1.8748626708984375, -1.820037841796875, -1.7652130126953125, -1.71038818359375, -1.6555633544921875, -1.600738525390625, -1.5459136962890625, -1.4910888671875, -1.4362640380859375, -1.381439208984375, -1.3266143798828125, -1.27178955078125, -1.2169647216796875, -1.162139892578125, -1.1073150634765625, -1.052490234375, -0.9976654052734375, -0.942840576171875, -0.8880157470703125, -0.83319091796875, -0.7783660888671875, -0.723541259765625, -0.6687164306640625, -0.6138916015625, -0.5590667724609375, -0.504241943359375, -0.4494171142578125, -0.39459228515625, -0.3397674560546875, -0.284942626953125, -0.2301177978515625, -0.17529296875, -0.1204681396484375, -0.065643310546875, -0.0108184814453125, 0.04400634765625, 0.0988311767578125, 0.153656005859375, 0.2084808349609375, 0.2633056640625, 0.3181304931640625, 0.372955322265625, 0.4277801513671875, 0.48260498046875, 0.5374298095703125, 0.592254638671875, 0.6470794677734375, 0.701904296875, 0.7567291259765625, 0.811553955078125, 0.8663787841796875, 0.92120361328125, 0.9760284423828125, 1.030853271484375, 1.0856781005859375, 1.1405029296875, 1.1953277587890625, 1.250152587890625, 1.3049774169921875, 1.35980224609375, 1.4146270751953125, 1.469451904296875, 1.5242767333984375, 1.5791015625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 14.0, 6.0, 8.0, 9.0, 8.0, 16.0, 26.0, 35.0, 36.0, 55.0, 53.0, 100.0, 100.0, 135.0, 192.0, 237.0, 312.0, 499.0, 1147.0, 4563.0, 26246.0, 213310.0, 661344.0, 117921.0, 16401.0, 3106.0, 925.0, 425.0, 300.0, 236.0, 180.0, 136.0, 91.0, 79.0, 72.0, 64.0, 44.0, 31.0, 24.0, 14.0, 15.0, 8.0, 7.0, 13.0, 5.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.30517578125, -0.2954444885253906, -0.28571319580078125, -0.2759819030761719, -0.2662506103515625, -0.2565193176269531, -0.24678802490234375, -0.23705673217773438, -0.227325439453125, -0.21759414672851562, -0.20786285400390625, -0.19813156127929688, -0.1884002685546875, -0.17866897583007812, -0.16893768310546875, -0.15920639038085938, -0.14947509765625, -0.13974380493164062, -0.13001251220703125, -0.12028121948242188, -0.1105499267578125, -0.10081863403320312, -0.09108734130859375, -0.08135604858398438, -0.071624755859375, -0.061893463134765625, -0.05216217041015625, -0.042430877685546875, -0.0326995849609375, -0.022968292236328125, -0.01323699951171875, -0.003505706787109375, 0.0062255859375, 0.015956878662109375, 0.02568817138671875, 0.035419464111328125, 0.0451507568359375, 0.054882049560546875, 0.06461334228515625, 0.07434463500976562, 0.084075927734375, 0.09380722045898438, 0.10353851318359375, 0.11326980590820312, 0.1230010986328125, 0.13273239135742188, 0.14246368408203125, 0.15219497680664062, 0.16192626953125, 0.17165756225585938, 0.18138885498046875, 0.19112014770507812, 0.2008514404296875, 0.21058273315429688, 0.22031402587890625, 0.23004531860351562, 0.239776611328125, 0.24950790405273438, 0.25923919677734375, 0.2689704895019531, 0.2787017822265625, 0.2884330749511719, 0.29816436767578125, 0.3078956604003906, 0.317626953125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 1.0, 5.0, 9.0, 10.0, 13.0, 11.0, 9.0, 10.0, 14.0, 17.0, 26.0, 28.0, 37.0, 27.0, 30.0, 31.0, 30.0, 45.0, 37.0, 43.0, 42.0, 40.0, 38.0, 42.0, 38.0, 43.0, 27.0, 25.0, 35.0, 35.0, 31.0, 33.0, 19.0, 13.0, 23.0, 20.0, 9.0, 12.0, 9.0, 3.0, 9.0, 3.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.228515625, -3.121917724609375, -3.01531982421875, -2.908721923828125, -2.8021240234375, -2.695526123046875, -2.58892822265625, -2.482330322265625, -2.375732421875, -2.269134521484375, -2.16253662109375, -2.055938720703125, -1.9493408203125, -1.842742919921875, -1.73614501953125, -1.629547119140625, -1.52294921875, -1.416351318359375, -1.30975341796875, -1.203155517578125, -1.0965576171875, -0.989959716796875, -0.88336181640625, -0.776763916015625, -0.670166015625, -0.563568115234375, -0.45697021484375, -0.350372314453125, -0.2437744140625, -0.137176513671875, -0.03057861328125, 0.076019287109375, 0.1826171875, 0.289215087890625, 0.39581298828125, 0.502410888671875, 0.6090087890625, 0.715606689453125, 0.82220458984375, 0.928802490234375, 1.035400390625, 1.141998291015625, 1.24859619140625, 1.355194091796875, 1.4617919921875, 1.568389892578125, 1.67498779296875, 1.781585693359375, 1.88818359375, 1.994781494140625, 2.10137939453125, 2.207977294921875, 2.3145751953125, 2.421173095703125, 2.52777099609375, 2.634368896484375, 2.740966796875, 2.847564697265625, 2.95416259765625, 3.060760498046875, 3.1673583984375, 3.273956298828125, 3.38055419921875, 3.487152099609375, 3.59375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 12.0, 15.0, 16.0, 29.0, 41.0, 67.0, 113.0, 232.0, 407.0, 837.0, 2297.0, 36544.0, 971513.0, 32396.0, 2324.0, 762.0, 423.0, 194.0, 114.0, 83.0, 48.0, 24.0, 19.0, 9.0, 2.0, 5.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06884765625, -0.06666088104248047, -0.06447410583496094, -0.062287330627441406, -0.060100555419921875, -0.057913780212402344, -0.05572700500488281, -0.05354022979736328, -0.05135345458984375, -0.04916667938232422, -0.04697990417480469, -0.044793128967285156, -0.042606353759765625, -0.040419578552246094, -0.03823280334472656, -0.03604602813720703, -0.0338592529296875, -0.03167247772216797, -0.029485702514648438, -0.027298927307128906, -0.025112152099609375, -0.022925376892089844, -0.020738601684570312, -0.01855182647705078, -0.01636505126953125, -0.014178276062011719, -0.011991500854492188, -0.009804725646972656, -0.007617950439453125, -0.005431175231933594, -0.0032444000244140625, -0.0010576248168945312, 0.001129150390625, 0.0033159255981445312, 0.0055027008056640625, 0.007689476013183594, 0.009876251220703125, 0.012063026428222656, 0.014249801635742188, 0.01643657684326172, 0.01862335205078125, 0.02081012725830078, 0.022996902465820312, 0.025183677673339844, 0.027370452880859375, 0.029557228088378906, 0.03174400329589844, 0.03393077850341797, 0.0361175537109375, 0.03830432891845703, 0.04049110412597656, 0.042677879333496094, 0.044864654541015625, 0.047051429748535156, 0.04923820495605469, 0.05142498016357422, 0.05361175537109375, 0.05579853057861328, 0.05798530578613281, 0.060172080993652344, 0.062358856201171875, 0.0645456314086914, 0.06673240661621094, 0.06891918182373047, 0.07110595703125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 10.0, 6.0, 5.0, 9.0, 15.0, 24.0, 22.0, 36.0, 33.0, 56.0, 63.0, 76.0, 65.0, 78.0, 88.0, 75.0, 81.0, 60.0, 42.0, 41.0, 33.0, 19.0, 17.0, 12.0, 8.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0219554901123047e-05, -2.930406481027603e-05, -2.8388574719429016e-05, -2.7473084628582e-05, -2.6557594537734985e-05, -2.564210444688797e-05, -2.4726614356040955e-05, -2.381112426519394e-05, -2.2895634174346924e-05, -2.198014408349991e-05, -2.1064653992652893e-05, -2.0149163901805878e-05, -1.9233673810958862e-05, -1.8318183720111847e-05, -1.740269362926483e-05, -1.6487203538417816e-05, -1.55717134475708e-05, -1.4656223356723785e-05, -1.374073326587677e-05, -1.2825243175029755e-05, -1.190975308418274e-05, -1.0994262993335724e-05, -1.0078772902488708e-05, -9.163282811641693e-06, -8.247792720794678e-06, -7.332302629947662e-06, -6.416812539100647e-06, -5.501322448253632e-06, -4.585832357406616e-06, -3.670342266559601e-06, -2.7548521757125854e-06, -1.83936208486557e-06, -9.238719940185547e-07, -8.381903171539307e-09, 9.071081876754761e-07, 1.8225982785224915e-06, 2.738088369369507e-06, 3.6535784602165222e-06, 4.569068551063538e-06, 5.484558641910553e-06, 6.400048732757568e-06, 7.315538823604584e-06, 8.231028914451599e-06, 9.146519005298615e-06, 1.006200909614563e-05, 1.0977499186992645e-05, 1.189298927783966e-05, 1.2808479368686676e-05, 1.3723969459533691e-05, 1.4639459550380707e-05, 1.5554949641227722e-05, 1.6470439732074738e-05, 1.7385929822921753e-05, 1.830141991376877e-05, 1.9216910004615784e-05, 2.01324000954628e-05, 2.1047890186309814e-05, 2.196338027715683e-05, 2.2878870368003845e-05, 2.379436045885086e-05, 2.4709850549697876e-05, 2.562534064054489e-05, 2.6540830731391907e-05, 2.7456320822238922e-05, 2.8371810913085938e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 11.0, 6.0, 6.0, 5.0, 10.0, 15.0, 21.0, 32.0, 41.0, 70.0, 144.0, 380.0, 1640.0, 16632.0, 858079.0, 164002.0, 6015.0, 855.0, 259.0, 106.0, 54.0, 30.0, 22.0, 13.0, 17.0, 10.0, 12.0, 6.0, 11.0, 5.0, 9.0, 5.0, 2.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1273193359375, -0.12290000915527344, -0.11848068237304688, -0.11406135559082031, -0.10964202880859375, -0.10522270202636719, -0.10080337524414062, -0.09638404846191406, -0.0919647216796875, -0.08754539489746094, -0.08312606811523438, -0.07870674133300781, -0.07428741455078125, -0.06986808776855469, -0.06544876098632812, -0.06102943420410156, -0.056610107421875, -0.05219078063964844, -0.047771453857421875, -0.04335212707519531, -0.03893280029296875, -0.03451347351074219, -0.030094146728515625, -0.025674819946289062, -0.0212554931640625, -0.016836166381835938, -0.012416839599609375, -0.007997512817382812, -0.00357818603515625, 0.0008411407470703125, 0.005260467529296875, 0.009679794311523438, 0.01409912109375, 0.018518447875976562, 0.022937774658203125, 0.027357101440429688, 0.03177642822265625, 0.03619575500488281, 0.040615081787109375, 0.04503440856933594, 0.0494537353515625, 0.05387306213378906, 0.058292388916015625, 0.06271171569824219, 0.06713104248046875, 0.07155036926269531, 0.07596969604492188, 0.08038902282714844, 0.084808349609375, 0.08922767639160156, 0.09364700317382812, 0.09806632995605469, 0.10248565673828125, 0.10690498352050781, 0.11132431030273438, 0.11574363708496094, 0.1201629638671875, 0.12458229064941406, 0.12900161743164062, 0.1334209442138672, 0.13784027099609375, 0.1422595977783203, 0.14667892456054688, 0.15109825134277344, 0.155517578125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 5.0, 3.0, 4.0, 7.0, 6.0, 9.0, 8.0, 12.0, 12.0, 14.0, 23.0, 21.0, 35.0, 41.0, 51.0, 60.0, 99.0, 128.0, 111.0, 77.0, 70.0, 43.0, 42.0, 18.0, 14.0, 12.0, 12.0, 17.0, 13.0, 5.0, 10.0, 2.0, 3.0, 6.0, 4.0, 2.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01025390625, -0.009896516799926758, -0.009539127349853516, -0.009181737899780273, -0.008824348449707031, -0.008466958999633789, -0.008109569549560547, -0.007752180099487305, -0.0073947906494140625, -0.00703740119934082, -0.006680011749267578, -0.006322622299194336, -0.005965232849121094, -0.0056078433990478516, -0.005250453948974609, -0.004893064498901367, -0.004535675048828125, -0.004178285598754883, -0.0038208961486816406, -0.0034635066986083984, -0.0031061172485351562, -0.002748727798461914, -0.002391338348388672, -0.0020339488983154297, -0.0016765594482421875, -0.0013191699981689453, -0.0009617805480957031, -0.0006043910980224609, -0.00024700164794921875, 0.00011038780212402344, 0.0004677772521972656, 0.0008251667022705078, 0.00118255615234375, 0.0015399456024169922, 0.0018973350524902344, 0.0022547245025634766, 0.0026121139526367188, 0.002969503402709961, 0.003326892852783203, 0.0036842823028564453, 0.0040416717529296875, 0.00439906120300293, 0.004756450653076172, 0.005113840103149414, 0.005471229553222656, 0.0058286190032958984, 0.006186008453369141, 0.006543397903442383, 0.006900787353515625, 0.007258176803588867, 0.007615566253662109, 0.007972955703735352, 0.008330345153808594, 0.008687734603881836, 0.009045124053955078, 0.00940251350402832, 0.009759902954101562, 0.010117292404174805, 0.010474681854248047, 0.010832071304321289, 0.011189460754394531, 0.011546850204467773, 0.011904239654541016, 0.012261629104614258, 0.0126190185546875]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 9.0, 14.0, 29.0, 58.0, 140.0, 264.0, 244.0, 147.0, 58.0, 18.0, 18.0, 6.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.962218284606934, -9.735429763793945, -9.50864028930664, -9.281851768493652, -9.055062294006348, -8.82827377319336, -8.601485252380371, -8.374695777893066, -8.147907257080078, -7.921118259429932, -7.694329261779785, -7.467540740966797, -7.24075174331665, -7.013962745666504, -6.787173748016357, -6.560384750366211, -6.333596229553223, -6.106807231903076, -5.88001823425293, -5.653229713439941, -5.426440715789795, -5.199651718139648, -4.972862720489502, -4.7460737228393555, -4.519284725189209, -4.2924957275390625, -4.065706729888916, -3.8389179706573486, -3.6121292114257812, -3.3853402137756348, -3.1585512161254883, -2.931762456893921, -2.7049736976623535, -2.478184700012207, -2.2513959407806396, -2.024606943130493, -1.7978181838989258, -1.5710291862487793, -1.3442403078079224, -1.1174514293670654, -0.8906625509262085, -0.6638736724853516, -0.43708476424217224, -0.21029585599899292, 0.016493022441864014, 0.24328196048736572, 0.47007083892822266, 0.6968597173690796, 0.9236485958099365, 1.1504374742507935, 1.3772263526916504, 1.6040153503417969, 1.8308041095733643, 2.0575931072235107, 2.284381866455078, 2.5111708641052246, 2.737959861755371, 2.9647488594055176, 3.191537618637085, 3.4183266162872314, 3.645115375518799, 3.8719043731689453, 4.098693370819092, 4.325482368469238, 4.552270889282227]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 18.0, 7.0, 9.0, 24.0, 10.0, 23.0, 23.0, 23.0, 25.0, 29.0, 42.0, 41.0, 49.0, 45.0, 40.0, 36.0, 46.0, 43.0, 38.0, 58.0, 56.0, 36.0, 40.0, 36.0, 41.0, 23.0, 28.0, 23.0, 19.0, 15.0, 10.0, 5.0, 13.0, 6.0, 3.0, 1.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9413150548934937, -1.8838117122650146, -1.8263084888458252, -1.7688051462173462, -1.7113018035888672, -1.6537985801696777, -1.5962952375411987, -1.5387918949127197, -1.4812886714935303, -1.4237853288650513, -1.3662821054458618, -1.3087787628173828, -1.2512755393981934, -1.1937721967697144, -1.1362688541412354, -1.078765630722046, -1.021262288093567, -0.9637590050697327, -0.9062557220458984, -0.8487523794174194, -0.7912490963935852, -0.733745813369751, -0.676242470741272, -0.6187391877174377, -0.5612359046936035, -0.5037326216697693, -0.44622930884361267, -0.38872599601745605, -0.3312227129936218, -0.2737194299697876, -0.21621611714363098, -0.15871280431747437, -0.10120940208435059, -0.043706104159355164, 0.013797193765640259, 0.07130049169063568, 0.1288037896156311, 0.18630707263946533, 0.24381038546562195, 0.30131369829177856, 0.3588169813156128, 0.416320264339447, 0.47382357716560364, 0.5313268899917603, 0.5888301730155945, 0.6463334560394287, 0.7038367986679077, 0.7613400816917419, 0.8188433647155762, 0.8763466477394104, 0.9338499307632446, 0.9913532733917236, 1.048856496810913, 1.106359839439392, 1.163863182067871, 1.2213664054870605, 1.2788697481155396, 1.3363730907440186, 1.393876314163208, 1.451379656791687, 1.508882999420166, 1.5663862228393555, 1.6238895654678345, 1.6813929080963135, 1.738896131515503]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 11.0, 14.0, 29.0, 45.0, 84.0, 133.0, 238.0, 383.0, 689.0, 1185.0, 2070.0, 3999.0, 7792.0, 16750.0, 43663.0, 150947.0, 571335.0, 167529.0, 46413.0, 17765.0, 8171.0, 4145.0, 2216.0, 1320.0, 693.0, 378.0, 213.0, 125.0, 82.0, 50.0, 27.0, 17.0, 7.0, 13.0, 7.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.5234375, -1.4817352294921875, -1.440032958984375, -1.3983306884765625, -1.35662841796875, -1.3149261474609375, -1.273223876953125, -1.2315216064453125, -1.1898193359375, -1.1481170654296875, -1.106414794921875, -1.0647125244140625, -1.02301025390625, -0.9813079833984375, -0.939605712890625, -0.8979034423828125, -0.856201171875, -0.8144989013671875, -0.772796630859375, -0.7310943603515625, -0.68939208984375, -0.6476898193359375, -0.605987548828125, -0.5642852783203125, -0.5225830078125, -0.4808807373046875, -0.439178466796875, -0.3974761962890625, -0.35577392578125, -0.3140716552734375, -0.272369384765625, -0.2306671142578125, -0.18896484375, -0.1472625732421875, -0.105560302734375, -0.0638580322265625, -0.02215576171875, 0.0195465087890625, 0.061248779296875, 0.1029510498046875, 0.1446533203125, 0.1863555908203125, 0.228057861328125, 0.2697601318359375, 0.31146240234375, 0.3531646728515625, 0.394866943359375, 0.4365692138671875, 0.478271484375, 0.5199737548828125, 0.561676025390625, 0.6033782958984375, 0.64508056640625, 0.6867828369140625, 0.728485107421875, 0.7701873779296875, 0.8118896484375, 0.8535919189453125, 0.895294189453125, 0.9369964599609375, 0.97869873046875, 1.0204010009765625, 1.062103271484375, 1.1038055419921875, 1.1455078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 3.0, 3.0, 10.0, 10.0, 8.0, 8.0, 17.0, 12.0, 25.0, 29.0, 28.0, 16.0, 44.0, 40.0, 35.0, 53.0, 45.0, 56.0, 51.0, 45.0, 45.0, 58.0, 36.0, 49.0, 38.0, 42.0, 22.0, 23.0, 30.0, 23.0, 19.0, 9.0, 10.0, 13.0, 10.0, 7.0, 8.0, 4.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.13671875, -4.98602294921875, -4.8353271484375, -4.68463134765625, -4.533935546875, -4.38323974609375, -4.2325439453125, -4.08184814453125, -3.93115234375, -3.78045654296875, -3.6297607421875, -3.47906494140625, -3.328369140625, -3.17767333984375, -3.0269775390625, -2.87628173828125, -2.7255859375, -2.57489013671875, -2.4241943359375, -2.27349853515625, -2.122802734375, -1.97210693359375, -1.8214111328125, -1.67071533203125, -1.52001953125, -1.36932373046875, -1.2186279296875, -1.06793212890625, -0.917236328125, -0.76654052734375, -0.6158447265625, -0.46514892578125, -0.314453125, -0.16375732421875, -0.0130615234375, 0.13763427734375, 0.288330078125, 0.43902587890625, 0.5897216796875, 0.74041748046875, 0.89111328125, 1.04180908203125, 1.1925048828125, 1.34320068359375, 1.493896484375, 1.64459228515625, 1.7952880859375, 1.94598388671875, 2.0966796875, 2.24737548828125, 2.3980712890625, 2.54876708984375, 2.699462890625, 2.85015869140625, 3.0008544921875, 3.15155029296875, 3.30224609375, 3.45294189453125, 3.6036376953125, 3.75433349609375, 3.905029296875, 4.05572509765625, 4.2064208984375, 4.35711669921875, 4.5078125]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 4.0, 5.0, 8.0, 11.0, 12.0, 22.0, 37.0, 44.0, 59.0, 93.0, 174.0, 441.0, 2293.0, 223114.0, 817753.0, 3450.0, 479.0, 209.0, 110.0, 61.0, 43.0, 31.0, 26.0, 28.0, 17.0, 12.0, 7.0, 7.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5, -7.2327880859375, -6.965576171875, -6.6983642578125, -6.43115234375, -6.1639404296875, -5.896728515625, -5.6295166015625, -5.3623046875, -5.0950927734375, -4.827880859375, -4.5606689453125, -4.29345703125, -4.0262451171875, -3.759033203125, -3.4918212890625, -3.224609375, -2.9573974609375, -2.690185546875, -2.4229736328125, -2.15576171875, -1.8885498046875, -1.621337890625, -1.3541259765625, -1.0869140625, -0.8197021484375, -0.552490234375, -0.2852783203125, -0.01806640625, 0.2491455078125, 0.516357421875, 0.7835693359375, 1.05078125, 1.3179931640625, 1.585205078125, 1.8524169921875, 2.11962890625, 2.3868408203125, 2.654052734375, 2.9212646484375, 3.1884765625, 3.4556884765625, 3.722900390625, 3.9901123046875, 4.25732421875, 4.5245361328125, 4.791748046875, 5.0589599609375, 5.326171875, 5.5933837890625, 5.860595703125, 6.1278076171875, 6.39501953125, 6.6622314453125, 6.929443359375, 7.1966552734375, 7.4638671875, 7.7310791015625, 7.998291015625, 8.2655029296875, 8.53271484375, 8.7999267578125, 9.067138671875, 9.3343505859375, 9.6015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 12.0, 4.0, 6.0, 8.0, 7.0, 14.0, 13.0, 25.0, 29.0, 27.0, 34.0, 34.0, 38.0, 44.0, 42.0, 39.0, 41.0, 54.0, 40.0, 45.0, 40.0, 45.0, 53.0, 43.0, 32.0, 29.0, 31.0, 34.0, 27.0, 18.0, 23.0, 15.0, 15.0, 11.0, 7.0, 3.0, 4.0, 8.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.66796875, -4.509033203125, -4.35009765625, -4.191162109375, -4.0322265625, -3.873291015625, -3.71435546875, -3.555419921875, -3.396484375, -3.237548828125, -3.07861328125, -2.919677734375, -2.7607421875, -2.601806640625, -2.44287109375, -2.283935546875, -2.125, -1.966064453125, -1.80712890625, -1.648193359375, -1.4892578125, -1.330322265625, -1.17138671875, -1.012451171875, -0.853515625, -0.694580078125, -0.53564453125, -0.376708984375, -0.2177734375, -0.058837890625, 0.10009765625, 0.259033203125, 0.41796875, 0.576904296875, 0.73583984375, 0.894775390625, 1.0537109375, 1.212646484375, 1.37158203125, 1.530517578125, 1.689453125, 1.848388671875, 2.00732421875, 2.166259765625, 2.3251953125, 2.484130859375, 2.64306640625, 2.802001953125, 2.9609375, 3.119873046875, 3.27880859375, 3.437744140625, 3.5966796875, 3.755615234375, 3.91455078125, 4.073486328125, 4.232421875, 4.391357421875, 4.55029296875, 4.709228515625, 4.8681640625, 5.027099609375, 5.18603515625, 5.344970703125, 5.50390625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 4.0, 10.0, 7.0, 28.0, 25.0, 56.0, 111.0, 253.0, 732.0, 2572.0, 19625.0, 807165.0, 203765.0, 11394.0, 1857.0, 527.0, 206.0, 86.0, 50.0, 31.0, 12.0, 14.0, 5.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.97607421875, -0.9434127807617188, -0.9107513427734375, -0.8780899047851562, -0.845428466796875, -0.8127670288085938, -0.7801055908203125, -0.7474441528320312, -0.71478271484375, -0.6821212768554688, -0.6494598388671875, -0.6167984008789062, -0.584136962890625, -0.5514755249023438, -0.5188140869140625, -0.48615264892578125, -0.4534912109375, -0.42082977294921875, -0.3881683349609375, -0.35550689697265625, -0.322845458984375, -0.29018402099609375, -0.2575225830078125, -0.22486114501953125, -0.19219970703125, -0.15953826904296875, -0.1268768310546875, -0.09421539306640625, -0.061553955078125, -0.02889251708984375, 0.0037689208984375, 0.03643035888671875, 0.069091796875, 0.10175323486328125, 0.1344146728515625, 0.16707611083984375, 0.199737548828125, 0.23239898681640625, 0.2650604248046875, 0.29772186279296875, 0.33038330078125, 0.36304473876953125, 0.3957061767578125, 0.42836761474609375, 0.461029052734375, 0.49369049072265625, 0.5263519287109375, 0.5590133666992188, 0.5916748046875, 0.6243362426757812, 0.6569976806640625, 0.6896591186523438, 0.722320556640625, 0.7549819946289062, 0.7876434326171875, 0.8203048706054688, 0.85296630859375, 0.8856277465820312, 0.9182891845703125, 0.9509506225585938, 0.983612060546875, 1.0162734985351562, 1.0489349365234375, 1.0815963745117188, 1.1142578125]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 4.0, 4.0, 6.0, 9.0, 10.0, 13.0, 13.0, 19.0, 25.0, 25.0, 37.0, 42.0, 63.0, 142.0, 255.0, 113.0, 54.0, 43.0, 28.0, 19.0, 19.0, 19.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.534027099609375e-05, -7.258821278810501e-05, -6.983615458011627e-05, -6.708409637212753e-05, -6.43320381641388e-05, -6.157997995615005e-05, -5.8827921748161316e-05, -5.607586354017258e-05, -5.332380533218384e-05, -5.05717471241951e-05, -4.781968891620636e-05, -4.506763070821762e-05, -4.231557250022888e-05, -3.956351429224014e-05, -3.6811456084251404e-05, -3.4059397876262665e-05, -3.1307339668273926e-05, -2.8555281460285187e-05, -2.5803223252296448e-05, -2.305116504430771e-05, -2.029910683631897e-05, -1.754704862833023e-05, -1.4794990420341492e-05, -1.2042932212352753e-05, -9.290874004364014e-06, -6.538815796375275e-06, -3.7867575883865356e-06, -1.0346993803977966e-06, 1.7173588275909424e-06, 4.469417035579681e-06, 7.22147524356842e-06, 9.97353345155716e-06, 1.2725591659545898e-05, 1.5477649867534637e-05, 1.8229708075523376e-05, 2.0981766283512115e-05, 2.3733824491500854e-05, 2.6485882699489594e-05, 2.9237940907478333e-05, 3.198999911546707e-05, 3.474205732345581e-05, 3.749411553144455e-05, 4.024617373943329e-05, 4.299823194742203e-05, 4.5750290155410767e-05, 4.8502348363399506e-05, 5.1254406571388245e-05, 5.4006464779376984e-05, 5.675852298736572e-05, 5.951058119535446e-05, 6.22626394033432e-05, 6.501469761133194e-05, 6.776675581932068e-05, 7.051881402730942e-05, 7.327087223529816e-05, 7.60229304432869e-05, 7.877498865127563e-05, 8.152704685926437e-05, 8.427910506725311e-05, 8.703116327524185e-05, 8.978322148323059e-05, 9.253527969121933e-05, 9.528733789920807e-05, 9.803939610719681e-05, 0.00010079145431518555]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [5.0, 4.0, 4.0, 0.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 7.0, 5.0, 8.0, 13.0, 11.0, 19.0, 14.0, 34.0, 49.0, 79.0, 131.0, 264.0, 597.0, 1866.0, 7161.0, 45441.0, 810283.0, 159175.0, 17835.0, 3577.0, 1114.0, 372.0, 190.0, 99.0, 64.0, 29.0, 18.0, 17.0, 8.0, 11.0, 6.0, 7.0, 4.0, 5.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.68603515625, -0.6621856689453125, -0.638336181640625, -0.6144866943359375, -0.59063720703125, -0.5667877197265625, -0.542938232421875, -0.5190887451171875, -0.4952392578125, -0.4713897705078125, -0.447540283203125, -0.4236907958984375, -0.39984130859375, -0.3759918212890625, -0.352142333984375, -0.3282928466796875, -0.304443359375, -0.2805938720703125, -0.256744384765625, -0.2328948974609375, -0.20904541015625, -0.1851959228515625, -0.161346435546875, -0.1374969482421875, -0.1136474609375, -0.0897979736328125, -0.065948486328125, -0.0420989990234375, -0.01824951171875, 0.0055999755859375, 0.029449462890625, 0.0532989501953125, 0.0771484375, 0.1009979248046875, 0.124847412109375, 0.1486968994140625, 0.17254638671875, 0.1963958740234375, 0.220245361328125, 0.2440948486328125, 0.2679443359375, 0.2917938232421875, 0.315643310546875, 0.3394927978515625, 0.36334228515625, 0.3871917724609375, 0.411041259765625, 0.4348907470703125, 0.458740234375, 0.4825897216796875, 0.506439208984375, 0.5302886962890625, 0.55413818359375, 0.5779876708984375, 0.601837158203125, 0.6256866455078125, 0.6495361328125, 0.6733856201171875, 0.697235107421875, 0.7210845947265625, 0.74493408203125, 0.7687835693359375, 0.792633056640625, 0.8164825439453125, 0.84033203125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 3.0, 5.0, 2.0, 6.0, 3.0, 5.0, 7.0, 11.0, 9.0, 16.0, 16.0, 13.0, 13.0, 24.0, 26.0, 25.0, 26.0, 42.0, 50.0, 266.0, 160.0, 52.0, 28.0, 33.0, 20.0, 18.0, 18.0, 26.0, 10.0, 7.0, 7.0, 6.0, 9.0, 9.0, 4.0, 2.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.16162109375, -0.15639495849609375, -0.1511688232421875, -0.14594268798828125, -0.140716552734375, -0.13549041748046875, -0.1302642822265625, -0.12503814697265625, -0.11981201171875, -0.11458587646484375, -0.1093597412109375, -0.10413360595703125, -0.098907470703125, -0.09368133544921875, -0.0884552001953125, -0.08322906494140625, -0.0780029296875, -0.07277679443359375, -0.0675506591796875, -0.06232452392578125, -0.057098388671875, -0.05187225341796875, -0.0466461181640625, -0.04141998291015625, -0.03619384765625, -0.03096771240234375, -0.0257415771484375, -0.02051544189453125, -0.015289306640625, -0.01006317138671875, -0.0048370361328125, 0.00038909912109375, 0.005615234375, 0.01084136962890625, 0.0160675048828125, 0.02129364013671875, 0.026519775390625, 0.03174591064453125, 0.0369720458984375, 0.04219818115234375, 0.04742431640625, 0.05265045166015625, 0.0578765869140625, 0.06310272216796875, 0.068328857421875, 0.07355499267578125, 0.0787811279296875, 0.08400726318359375, 0.0892333984375, 0.09445953369140625, 0.0996856689453125, 0.10491180419921875, 0.110137939453125, 0.11536407470703125, 0.1205902099609375, 0.12581634521484375, 0.13104248046875, 0.13626861572265625, 0.1414947509765625, 0.14672088623046875, 0.151947021484375, 0.15717315673828125, 0.1623992919921875, 0.16762542724609375, 0.1728515625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 167.0, 772.0, 65.0, 6.0, 3.0], "bins": [-84.81537628173828, -83.41034698486328, -82.00531768798828, -80.60029602050781, -79.19526672363281, -77.79023742675781, -76.38520812988281, -74.98017883300781, -73.57514953613281, -72.17012023925781, -70.76509094238281, -69.36006164550781, -67.95503997802734, -66.55001068115234, -65.14498138427734, -63.739952087402344, -62.33492660522461, -60.92989730834961, -59.524871826171875, -58.119842529296875, -56.714813232421875, -55.309783935546875, -53.90475845336914, -52.49972915649414, -51.094703674316406, -49.689674377441406, -48.28464889526367, -46.87961959838867, -45.47459030151367, -44.06956481933594, -42.66453552246094, -41.25950622558594, -39.85447692871094, -38.44944763183594, -37.0444221496582, -35.6393928527832, -34.2343635559082, -32.82933807373047, -31.42430877685547, -30.01927947998047, -28.6142520904541, -27.209224700927734, -25.804195404052734, -24.399168014526367, -22.994140625, -21.589111328125, -20.184083938598633, -18.779056549072266, -17.374027252197266, -15.968998908996582, -14.563970565795898, -13.158943176269531, -11.753914833068848, -10.348886489868164, -8.943859100341797, -7.538830757141113, -6.13380241394043, -4.728774070739746, -3.3237462043762207, -1.9187183380126953, -0.5136899948120117, 0.8913383483886719, 2.296365737915039, 3.7013940811157227, 5.106422424316406]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 6.0, 7.0, 6.0, 6.0, 5.0, 11.0, 9.0, 10.0, 14.0, 14.0, 14.0, 21.0, 27.0, 26.0, 33.0, 28.0, 34.0, 42.0, 36.0, 57.0, 41.0, 28.0, 39.0, 32.0, 39.0, 42.0, 34.0, 44.0, 35.0, 44.0, 30.0, 24.0, 27.0, 25.0, 15.0, 15.0, 15.0, 8.0, 11.0, 13.0, 13.0, 5.0, 7.0, 1.0, 5.0, 9.0, 3.0, 0.0, 2.0, 2.0], "bins": [-7.683573246002197, -7.47662878036499, -7.269683837890625, -7.062739372253418, -6.855794906616211, -6.648850440979004, -6.441905975341797, -6.234961032867432, -6.028016567230225, -5.821072101593018, -5.614127159118652, -5.407182693481445, -5.200238227844238, -4.993293762207031, -4.786349296569824, -4.579404354095459, -4.372459888458252, -4.165515422821045, -3.958570718765259, -3.7516260147094727, -3.5446815490722656, -3.3377370834350586, -3.1307923793792725, -2.9238476753234863, -2.7169032096862793, -2.5099587440490723, -2.303014039993286, -2.0960693359375, -1.889124870300293, -1.6821802854537964, -1.4752357006072998, -1.2682911157608032, -1.0613465309143066, -0.8544019460678101, -0.6474573612213135, -0.4405127763748169, -0.2335681915283203, -0.02662360668182373, 0.18032097816467285, 0.38726556301116943, 0.594210147857666, 0.8011547327041626, 1.0080993175506592, 1.2150439023971558, 1.4219884872436523, 1.628933072090149, 1.8358776569366455, 2.0428223609924316, 2.2497668266296387, 2.4567112922668457, 2.663655996322632, 2.870600700378418, 3.077545166015625, 3.284489631652832, 3.491434335708618, 3.6983790397644043, 3.9053235054016113, 4.112267971038818, 4.319212913513184, 4.526157379150391, 4.733101844787598, 4.940046310424805, 5.146990776062012, 5.353935718536377, 5.560880184173584]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 9.0, 4.0, 6.0, 11.0, 15.0, 20.0, 30.0, 56.0, 83.0, 131.0, 204.0, 388.0, 765.0, 1802.0, 4748.0, 13808.0, 59859.0, 584203.0, 3235562.0, 239446.0, 36829.0, 9807.0, 3542.0, 1442.0, 642.0, 369.0, 186.0, 99.0, 71.0, 46.0, 36.0, 22.0, 13.0, 13.0, 3.0, 8.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.52734375, -3.430267333984375, -3.33319091796875, -3.236114501953125, -3.1390380859375, -3.041961669921875, -2.94488525390625, -2.847808837890625, -2.750732421875, -2.653656005859375, -2.55657958984375, -2.459503173828125, -2.3624267578125, -2.265350341796875, -2.16827392578125, -2.071197509765625, -1.97412109375, -1.877044677734375, -1.77996826171875, -1.682891845703125, -1.5858154296875, -1.488739013671875, -1.39166259765625, -1.294586181640625, -1.197509765625, -1.100433349609375, -1.00335693359375, -0.906280517578125, -0.8092041015625, -0.712127685546875, -0.61505126953125, -0.517974853515625, -0.4208984375, -0.323822021484375, -0.22674560546875, -0.129669189453125, -0.0325927734375, 0.064483642578125, 0.16156005859375, 0.258636474609375, 0.355712890625, 0.452789306640625, 0.54986572265625, 0.646942138671875, 0.7440185546875, 0.841094970703125, 0.93817138671875, 1.035247802734375, 1.13232421875, 1.229400634765625, 1.32647705078125, 1.423553466796875, 1.5206298828125, 1.617706298828125, 1.71478271484375, 1.811859130859375, 1.908935546875, 2.006011962890625, 2.10308837890625, 2.200164794921875, 2.2972412109375, 2.394317626953125, 2.49139404296875, 2.588470458984375, 2.685546875]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 3.0, 8.0, 14.0, 6.0, 15.0, 19.0, 26.0, 27.0, 32.0, 44.0, 53.0, 58.0, 65.0, 70.0, 65.0, 76.0, 80.0, 63.0, 55.0, 46.0, 40.0, 32.0, 27.0, 24.0, 22.0, 5.0, 8.0, 6.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.103515625, -3.027099609375, -2.95068359375, -2.874267578125, -2.7978515625, -2.721435546875, -2.64501953125, -2.568603515625, -2.4921875, -2.415771484375, -2.33935546875, -2.262939453125, -2.1865234375, -2.110107421875, -2.03369140625, -1.957275390625, -1.880859375, -1.804443359375, -1.72802734375, -1.651611328125, -1.5751953125, -1.498779296875, -1.42236328125, -1.345947265625, -1.26953125, -1.193115234375, -1.11669921875, -1.040283203125, -0.9638671875, -0.887451171875, -0.81103515625, -0.734619140625, -0.658203125, -0.581787109375, -0.50537109375, -0.428955078125, -0.3525390625, -0.276123046875, -0.19970703125, -0.123291015625, -0.046875, 0.029541015625, 0.10595703125, 0.182373046875, 0.2587890625, 0.335205078125, 0.41162109375, 0.488037109375, 0.564453125, 0.640869140625, 0.71728515625, 0.793701171875, 0.8701171875, 0.946533203125, 1.02294921875, 1.099365234375, 1.17578125, 1.252197265625, 1.32861328125, 1.405029296875, 1.4814453125, 1.557861328125, 1.63427734375, 1.710693359375, 1.787109375]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 2.0, 6.0, 8.0, 7.0, 22.0, 47.0, 159.0, 572.0, 4176832.0, 16145.0, 328.0, 96.0, 38.0, 13.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.75, -39.67236328125, -38.5947265625, -37.51708984375, -36.439453125, -35.36181640625, -34.2841796875, -33.20654296875, -32.12890625, -31.05126953125, -29.9736328125, -28.89599609375, -27.818359375, -26.74072265625, -25.6630859375, -24.58544921875, -23.5078125, -22.43017578125, -21.3525390625, -20.27490234375, -19.197265625, -18.11962890625, -17.0419921875, -15.96435546875, -14.88671875, -13.80908203125, -12.7314453125, -11.65380859375, -10.576171875, -9.49853515625, -8.4208984375, -7.34326171875, -6.265625, -5.18798828125, -4.1103515625, -3.03271484375, -1.955078125, -0.87744140625, 0.2001953125, 1.27783203125, 2.35546875, 3.43310546875, 4.5107421875, 5.58837890625, 6.666015625, 7.74365234375, 8.8212890625, 9.89892578125, 10.9765625, 12.05419921875, 13.1318359375, 14.20947265625, 15.287109375, 16.36474609375, 17.4423828125, 18.52001953125, 19.59765625, 20.67529296875, 21.7529296875, 22.83056640625, 23.908203125, 24.98583984375, 26.0634765625, 27.14111328125, 28.21875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 9.0, 7.0, 10.0, 25.0, 32.0, 71.0, 133.0, 269.0, 709.0, 1741.0, 546.0, 263.0, 130.0, 56.0, 31.0, 28.0, 12.0, 7.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72705078125, -0.6853561401367188, -0.6436614990234375, -0.6019668579101562, -0.560272216796875, -0.5185775756835938, -0.4768829345703125, -0.43518829345703125, -0.39349365234375, -0.35179901123046875, -0.3101043701171875, -0.26840972900390625, -0.226715087890625, -0.18502044677734375, -0.1433258056640625, -0.10163116455078125, -0.0599365234375, -0.01824188232421875, 0.0234527587890625, 0.06514739990234375, 0.106842041015625, 0.14853668212890625, 0.1902313232421875, 0.23192596435546875, 0.27362060546875, 0.31531524658203125, 0.3570098876953125, 0.39870452880859375, 0.440399169921875, 0.48209381103515625, 0.5237884521484375, 0.5654830932617188, 0.607177734375, 0.6488723754882812, 0.6905670166015625, 0.7322616577148438, 0.773956298828125, 0.8156509399414062, 0.8573455810546875, 0.8990402221679688, 0.94073486328125, 0.9824295043945312, 1.0241241455078125, 1.0658187866210938, 1.107513427734375, 1.1492080688476562, 1.1909027099609375, 1.2325973510742188, 1.2742919921875, 1.3159866333007812, 1.3576812744140625, 1.3993759155273438, 1.441070556640625, 1.4827651977539062, 1.5244598388671875, 1.5661544799804688, 1.60784912109375, 1.6495437622070312, 1.6912384033203125, 1.7329330444335938, 1.774627685546875, 1.8163223266601562, 1.8580169677734375, 1.8997116088867188, 1.94140625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 7.0, 7.0, 10.0, 11.0, 17.0, 47.0, 71.0, 124.0, 201.0, 212.0, 127.0, 74.0, 44.0, 21.0, 11.0, 9.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.4368205070495605, -6.26836633682251, -6.099912166595459, -5.93145751953125, -5.763003349304199, -5.594549179077148, -5.426095008850098, -5.257640838623047, -5.089186668395996, -4.920732498168945, -4.7522783279418945, -4.583824157714844, -4.415369510650635, -4.246915340423584, -4.078461170196533, -3.9100069999694824, -3.7415523529052734, -3.5730981826782227, -3.4046437740325928, -3.236189603805542, -3.067735195159912, -2.8992810249328613, -2.7308268547058105, -2.5623726844787598, -2.39391827583313, -2.225464105606079, -2.057009696960449, -1.8885555267333984, -1.720101237297058, -1.5516469478607178, -1.383192777633667, -1.2147384881973267, -1.0462837219238281, -0.8778294324874878, -0.7093752026557922, -0.5409209728240967, -0.37246668338775635, -0.20401239395141602, -0.035558223724365234, 0.1328960657119751, 0.30135035514831543, 0.4698046147823334, 0.6382588744163513, 0.8067131042480469, 0.9751673936843872, 1.1436216831207275, 1.3120758533477783, 1.4805301427841187, 1.648984432220459, 1.8174387216567993, 1.9858930110931396, 2.1543471813201904, 2.3228015899658203, 2.491255760192871, 2.659709930419922, 2.8281641006469727, 2.9966185092926025, 3.1650726795196533, 3.333527088165283, 3.501981258392334, 3.6704354286193848, 3.8388898372650146, 4.0073442459106445, 4.175798416137695, 4.344252586364746]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 3.0, 12.0, 13.0, 15.0, 15.0, 28.0, 17.0, 24.0, 34.0, 39.0, 37.0, 37.0, 59.0, 52.0, 54.0, 58.0, 58.0, 45.0, 59.0, 45.0, 47.0, 45.0, 44.0, 26.0, 29.0, 14.0, 18.0, 10.0, 10.0, 12.0, 10.0, 3.0, 4.0, 5.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.319945812225342, -2.254977226257324, -2.1900088787078857, -2.125040292739868, -2.0600717067718506, -1.9951032400131226, -1.9301347732543945, -1.865166187286377, -1.800197720527649, -1.735229253768921, -1.6702606678009033, -1.6052922010421753, -1.5403237342834473, -1.4753551483154297, -1.4103866815567017, -1.3454182147979736, -1.280449628829956, -1.215481162071228, -1.1505125761032104, -1.0855441093444824, -1.0205755233764648, -0.9556070566177368, -0.8906385898590088, -0.825670063495636, -0.7607015371322632, -0.6957330107688904, -0.6307644844055176, -0.5657960176467896, -0.5008274912834167, -0.43585896492004395, -0.37089046835899353, -0.3059219717979431, -0.24095332622528076, -0.17598481476306915, -0.11101630330085754, -0.046047791838645935, 0.018920719623565674, 0.08388924598693848, 0.1488577425479889, 0.2138262391090393, 0.2787947654724121, 0.3437632918357849, 0.4087317883968353, 0.47370028495788574, 0.5386688113212585, 0.6036373376846313, 0.6686058044433594, 0.7335743308067322, 0.798542857170105, 0.8635113835334778, 0.9284799098968506, 0.9934483766555786, 1.0584168434143066, 1.1233854293823242, 1.1883538961410522, 1.2533223628997803, 1.3182909488677979, 1.3832594156265259, 1.4482280015945435, 1.5131964683532715, 1.578165054321289, 1.643133521080017, 1.7081019878387451, 1.7730705738067627, 1.8380390405654907]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 4.0, 9.0, 12.0, 14.0, 24.0, 50.0, 52.0, 94.0, 174.0, 260.0, 427.0, 732.0, 1517.0, 4156.0, 31778.0, 845750.0, 150414.0, 8504.0, 2165.0, 992.0, 585.0, 328.0, 168.0, 122.0, 80.0, 51.0, 22.0, 21.0, 20.0, 10.0, 7.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62158203125, -0.6031494140625, -0.584716796875, -0.5662841796875, -0.5478515625, -0.5294189453125, -0.510986328125, -0.4925537109375, -0.47412109375, -0.4556884765625, -0.437255859375, -0.4188232421875, -0.400390625, -0.3819580078125, -0.363525390625, -0.3450927734375, -0.32666015625, -0.3082275390625, -0.289794921875, -0.2713623046875, -0.2529296875, -0.2344970703125, -0.216064453125, -0.1976318359375, -0.17919921875, -0.1607666015625, -0.142333984375, -0.1239013671875, -0.10546875, -0.0870361328125, -0.068603515625, -0.0501708984375, -0.03173828125, -0.0133056640625, 0.005126953125, 0.0235595703125, 0.0419921875, 0.0604248046875, 0.078857421875, 0.0972900390625, 0.11572265625, 0.1341552734375, 0.152587890625, 0.1710205078125, 0.189453125, 0.2078857421875, 0.226318359375, 0.2447509765625, 0.26318359375, 0.2816162109375, 0.300048828125, 0.3184814453125, 0.3369140625, 0.3553466796875, 0.373779296875, 0.3922119140625, 0.41064453125, 0.4290771484375, 0.447509765625, 0.4659423828125, 0.484375, 0.5028076171875, 0.521240234375, 0.5396728515625, 0.55810546875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 4.0, 1.0, 5.0, 7.0, 4.0, 6.0, 12.0, 18.0, 18.0, 34.0, 35.0, 29.0, 52.0, 53.0, 68.0, 76.0, 75.0, 77.0, 84.0, 64.0, 52.0, 46.0, 47.0, 30.0, 35.0, 17.0, 15.0, 20.0, 6.0, 3.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.5859375, -2.524444580078125, -2.46295166015625, -2.401458740234375, -2.3399658203125, -2.278472900390625, -2.21697998046875, -2.155487060546875, -2.093994140625, -2.032501220703125, -1.97100830078125, -1.909515380859375, -1.8480224609375, -1.786529541015625, -1.72503662109375, -1.663543701171875, -1.60205078125, -1.540557861328125, -1.47906494140625, -1.417572021484375, -1.3560791015625, -1.294586181640625, -1.23309326171875, -1.171600341796875, -1.110107421875, -1.048614501953125, -0.98712158203125, -0.925628662109375, -0.8641357421875, -0.802642822265625, -0.74114990234375, -0.679656982421875, -0.6181640625, -0.556671142578125, -0.49517822265625, -0.433685302734375, -0.3721923828125, -0.310699462890625, -0.24920654296875, -0.187713623046875, -0.126220703125, -0.064727783203125, -0.00323486328125, 0.058258056640625, 0.1197509765625, 0.181243896484375, 0.24273681640625, 0.304229736328125, 0.36572265625, 0.427215576171875, 0.48870849609375, 0.550201416015625, 0.6116943359375, 0.673187255859375, 0.73468017578125, 0.796173095703125, 0.857666015625, 0.919158935546875, 0.98065185546875, 1.042144775390625, 1.1036376953125, 1.165130615234375, 1.22662353515625, 1.288116455078125, 1.349609375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 6.0, 4.0, 2.0, 2.0, 7.0, 7.0, 10.0, 5.0, 11.0, 11.0, 16.0, 22.0, 40.0, 42.0, 52.0, 69.0, 94.0, 113.0, 145.0, 226.0, 347.0, 788.0, 2334.0, 11323.0, 85009.0, 692585.0, 224495.0, 24235.0, 4158.0, 1038.0, 410.0, 228.0, 186.0, 119.0, 99.0, 74.0, 53.0, 29.0, 36.0, 34.0, 30.0, 17.0, 12.0, 10.0, 5.0, 9.0, 3.0, 7.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.2188720703125, -0.21237754821777344, -0.20588302612304688, -0.1993885040283203, -0.19289398193359375, -0.1863994598388672, -0.17990493774414062, -0.17341041564941406, -0.1669158935546875, -0.16042137145996094, -0.15392684936523438, -0.1474323272705078, -0.14093780517578125, -0.1344432830810547, -0.12794876098632812, -0.12145423889160156, -0.114959716796875, -0.10846519470214844, -0.10197067260742188, -0.09547615051269531, -0.08898162841796875, -0.08248710632324219, -0.07599258422851562, -0.06949806213378906, -0.0630035400390625, -0.05650901794433594, -0.050014495849609375, -0.04351997375488281, -0.03702545166015625, -0.030530929565429688, -0.024036407470703125, -0.017541885375976562, -0.01104736328125, -0.0045528411865234375, 0.001941680908203125, 0.008436203002929688, 0.01493072509765625, 0.021425247192382812, 0.027919769287109375, 0.03441429138183594, 0.0409088134765625, 0.04740333557128906, 0.053897857666015625, 0.06039237976074219, 0.06688690185546875, 0.07338142395019531, 0.07987594604492188, 0.08637046813964844, 0.092864990234375, 0.09935951232910156, 0.10585403442382812, 0.11234855651855469, 0.11884307861328125, 0.1253376007080078, 0.13183212280273438, 0.13832664489746094, 0.1448211669921875, 0.15131568908691406, 0.15781021118164062, 0.1643047332763672, 0.17079925537109375, 0.1772937774658203, 0.18378829956054688, 0.19028282165527344, 0.19677734375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 1.0, 5.0, 3.0, 9.0, 7.0, 4.0, 6.0, 13.0, 14.0, 27.0, 18.0, 21.0, 17.0, 28.0, 25.0, 45.0, 33.0, 40.0, 37.0, 45.0, 50.0, 49.0, 27.0, 42.0, 49.0, 38.0, 46.0, 32.0, 27.0, 40.0, 28.0, 30.0, 19.0, 20.0, 12.0, 12.0, 19.0, 10.0, 11.0, 12.0, 6.0, 7.0, 7.0, 2.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-2.4609375, -2.3931427001953125, -2.325347900390625, -2.2575531005859375, -2.18975830078125, -2.1219635009765625, -2.054168701171875, -1.9863739013671875, -1.9185791015625, -1.8507843017578125, -1.782989501953125, -1.7151947021484375, -1.64739990234375, -1.5796051025390625, -1.511810302734375, -1.4440155029296875, -1.376220703125, -1.3084259033203125, -1.240631103515625, -1.1728363037109375, -1.10504150390625, -1.0372467041015625, -0.969451904296875, -0.9016571044921875, -0.8338623046875, -0.7660675048828125, -0.698272705078125, -0.6304779052734375, -0.56268310546875, -0.4948883056640625, -0.427093505859375, -0.3592987060546875, -0.29150390625, -0.2237091064453125, -0.155914306640625, -0.0881195068359375, -0.02032470703125, 0.0474700927734375, 0.115264892578125, 0.1830596923828125, 0.2508544921875, 0.3186492919921875, 0.386444091796875, 0.4542388916015625, 0.52203369140625, 0.5898284912109375, 0.657623291015625, 0.7254180908203125, 0.793212890625, 0.8610076904296875, 0.928802490234375, 0.9965972900390625, 1.06439208984375, 1.1321868896484375, 1.199981689453125, 1.2677764892578125, 1.3355712890625, 1.4033660888671875, 1.471160888671875, 1.5389556884765625, 1.60675048828125, 1.6745452880859375, 1.742340087890625, 1.8101348876953125, 1.8779296875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 6.0, 6.0, 8.0, 9.0, 17.0, 15.0, 24.0, 44.0, 71.0, 125.0, 174.0, 334.0, 528.0, 1033.0, 3256.0, 26448.0, 887197.0, 119603.0, 6427.0, 1585.0, 666.0, 367.0, 204.0, 146.0, 74.0, 49.0, 37.0, 29.0, 13.0, 14.0, 13.0, 10.0, 7.0, 2.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0304107666015625, -0.02927231788635254, -0.028133869171142578, -0.026995420455932617, -0.025856971740722656, -0.024718523025512695, -0.023580074310302734, -0.022441625595092773, -0.021303176879882812, -0.02016472816467285, -0.01902627944946289, -0.01788783073425293, -0.01674938201904297, -0.015610933303833008, -0.014472484588623047, -0.013334035873413086, -0.012195587158203125, -0.011057138442993164, -0.009918689727783203, -0.008780241012573242, -0.007641792297363281, -0.00650334358215332, -0.005364894866943359, -0.0042264461517333984, -0.0030879974365234375, -0.0019495487213134766, -0.0008111000061035156, 0.0003273487091064453, 0.0014657974243164062, 0.002604246139526367, 0.003742694854736328, 0.004881143569946289, 0.00601959228515625, 0.007158041000366211, 0.008296489715576172, 0.009434938430786133, 0.010573387145996094, 0.011711835861206055, 0.012850284576416016, 0.013988733291625977, 0.015127182006835938, 0.0162656307220459, 0.01740407943725586, 0.01854252815246582, 0.01968097686767578, 0.020819425582885742, 0.021957874298095703, 0.023096323013305664, 0.024234771728515625, 0.025373220443725586, 0.026511669158935547, 0.027650117874145508, 0.02878856658935547, 0.02992701530456543, 0.03106546401977539, 0.03220391273498535, 0.03334236145019531, 0.03448081016540527, 0.035619258880615234, 0.036757707595825195, 0.037896156311035156, 0.03903460502624512, 0.04017305374145508, 0.04131150245666504, 0.042449951171875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 5.0, 11.0, 11.0, 12.0, 20.0, 35.0, 72.0, 80.0, 118.0, 160.0, 144.0, 120.0, 83.0, 50.0, 28.0, 20.0, 8.0, 10.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.4689903259277344e-05, -3.377348184585571e-05, -3.285706043243408e-05, -3.194063901901245e-05, -3.102421760559082e-05, -3.010779619216919e-05, -2.919137477874756e-05, -2.8274953365325928e-05, -2.7358531951904297e-05, -2.6442110538482666e-05, -2.5525689125061035e-05, -2.4609267711639404e-05, -2.3692846298217773e-05, -2.2776424884796143e-05, -2.1860003471374512e-05, -2.094358205795288e-05, -2.002716064453125e-05, -1.911073923110962e-05, -1.8194317817687988e-05, -1.7277896404266357e-05, -1.6361474990844727e-05, -1.5445053577423096e-05, -1.4528632164001465e-05, -1.3612210750579834e-05, -1.2695789337158203e-05, -1.1779367923736572e-05, -1.0862946510314941e-05, -9.94652509689331e-06, -9.03010368347168e-06, -8.113682270050049e-06, -7.197260856628418e-06, -6.280839443206787e-06, -5.364418029785156e-06, -4.447996616363525e-06, -3.5315752029418945e-06, -2.6151537895202637e-06, -1.6987323760986328e-06, -7.82310962677002e-07, 1.341104507446289e-07, 1.0505318641662598e-06, 1.9669532775878906e-06, 2.8833746910095215e-06, 3.7997961044311523e-06, 4.716217517852783e-06, 5.632638931274414e-06, 6.549060344696045e-06, 7.465481758117676e-06, 8.381903171539307e-06, 9.298324584960938e-06, 1.0214745998382568e-05, 1.11311674118042e-05, 1.204758882522583e-05, 1.2964010238647461e-05, 1.3880431652069092e-05, 1.4796853065490723e-05, 1.5713274478912354e-05, 1.6629695892333984e-05, 1.7546117305755615e-05, 1.8462538719177246e-05, 1.9378960132598877e-05, 2.0295381546020508e-05, 2.121180295944214e-05, 2.212822437286377e-05, 2.30446457862854e-05, 2.396106719970703e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 2.0, 4.0, 9.0, 7.0, 10.0, 21.0, 26.0, 24.0, 71.0, 122.0, 571.0, 5766.0, 860713.0, 177299.0, 3220.0, 405.0, 120.0, 52.0, 26.0, 17.0, 13.0, 17.0, 12.0, 7.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11846923828125, -0.11475467681884766, -0.11104011535644531, -0.10732555389404297, -0.10361099243164062, -0.09989643096923828, -0.09618186950683594, -0.0924673080444336, -0.08875274658203125, -0.0850381851196289, -0.08132362365722656, -0.07760906219482422, -0.07389450073242188, -0.07017993927001953, -0.06646537780761719, -0.06275081634521484, -0.0590362548828125, -0.055321693420410156, -0.05160713195800781, -0.04789257049560547, -0.044178009033203125, -0.04046344757080078, -0.03674888610839844, -0.033034324645996094, -0.02931976318359375, -0.025605201721191406, -0.021890640258789062, -0.01817607879638672, -0.014461517333984375, -0.010746955871582031, -0.0070323944091796875, -0.0033178329467773438, 0.000396728515625, 0.004111289978027344, 0.007825851440429688, 0.011540412902832031, 0.015254974365234375, 0.01896953582763672, 0.022684097290039062, 0.026398658752441406, 0.03011322021484375, 0.033827781677246094, 0.03754234313964844, 0.04125690460205078, 0.044971466064453125, 0.04868602752685547, 0.05240058898925781, 0.056115150451660156, 0.0598297119140625, 0.06354427337646484, 0.06725883483886719, 0.07097339630126953, 0.07468795776367188, 0.07840251922607422, 0.08211708068847656, 0.0858316421508789, 0.08954620361328125, 0.0932607650756836, 0.09697532653808594, 0.10068988800048828, 0.10440444946289062, 0.10811901092529297, 0.11183357238769531, 0.11554813385009766, 0.1192626953125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 7.0, 7.0, 5.0, 10.0, 14.0, 34.0, 55.0, 68.0, 107.0, 146.0, 158.0, 124.0, 69.0, 55.0, 38.0, 24.0, 22.0, 18.0, 6.0, 7.0, 4.0, 0.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007061004638671875, -0.006835043430328369, -0.006609082221984863, -0.006383121013641357, -0.0061571598052978516, -0.005931198596954346, -0.00570523738861084, -0.005479276180267334, -0.005253314971923828, -0.005027353763580322, -0.004801392555236816, -0.0045754313468933105, -0.004349470138549805, -0.004123508930206299, -0.003897547721862793, -0.003671586513519287, -0.0034456253051757812, -0.0032196640968322754, -0.0029937028884887695, -0.0027677416801452637, -0.002541780471801758, -0.002315819263458252, -0.002089858055114746, -0.0018638968467712402, -0.0016379356384277344, -0.0014119744300842285, -0.0011860132217407227, -0.0009600520133972168, -0.0007340908050537109, -0.0005081295967102051, -0.0002821683883666992, -5.620718002319336e-05, 0.0001697540283203125, 0.00039571523666381836, 0.0006216764450073242, 0.0008476376533508301, 0.001073598861694336, 0.0012995600700378418, 0.0015255212783813477, 0.0017514824867248535, 0.0019774436950683594, 0.0022034049034118652, 0.002429366111755371, 0.002655327320098877, 0.002881288528442383, 0.0031072497367858887, 0.0033332109451293945, 0.0035591721534729004, 0.0037851333618164062, 0.004011094570159912, 0.004237055778503418, 0.004463016986846924, 0.00468897819519043, 0.0049149394035339355, 0.005140900611877441, 0.005366861820220947, 0.005592823028564453, 0.005818784236907959, 0.006044745445251465, 0.006270706653594971, 0.0064966678619384766, 0.006722629070281982, 0.006948590278625488, 0.007174551486968994, 0.0074005126953125]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 3.0, 7.0, 6.0, 10.0, 19.0, 23.0, 54.0, 60.0, 123.0, 167.0, 186.0, 134.0, 84.0, 42.0, 30.0, 15.0, 10.0, 10.0, 7.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9169973134994507, -1.821810007095337, -1.7266225814819336, -1.6314352750778198, -1.536247968673706, -1.4410605430603027, -1.345873236656189, -1.2506859302520752, -1.1554985046386719, -1.060311198234558, -0.9651237726211548, -0.869936466217041, -0.7747491002082825, -0.6795617341995239, -0.5843744277954102, -0.4891870617866516, -0.39399969577789307, -0.2988123297691345, -0.20362499356269836, -0.10843765735626221, -0.013250291347503662, 0.08193707466125488, 0.17712438106536865, 0.2723117470741272, 0.36749911308288574, 0.4626864790916443, 0.5578738451004028, 0.6530611515045166, 0.7482485175132751, 0.8434358835220337, 0.9386231899261475, 1.0338106155395508, 1.128997802734375, 1.2241851091384888, 1.319372534751892, 1.4145598411560059, 1.5097472667694092, 1.604934573173523, 1.7001218795776367, 1.79530930519104, 1.8904966115951538, 1.9856839179992676, 2.080871343612671, 2.176058769226074, 2.2712459564208984, 2.3664333820343018, 2.461620807647705, 2.5568079948425293, 2.6519954204559326, 2.747182846069336, 2.84237003326416, 2.9375574588775635, 3.032744884490967, 3.127932071685791, 3.2231194972991943, 3.3183069229125977, 3.413494110107422, 3.508681535720825, 3.6038687229156494, 3.6990561485290527, 3.794243574142456, 3.8894309997558594, 3.9846181869506836, 4.079805374145508, 4.17499303817749]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 10.0, 5.0, 5.0, 13.0, 15.0, 22.0, 20.0, 23.0, 36.0, 27.0, 53.0, 47.0, 47.0, 67.0, 70.0, 63.0, 65.0, 60.0, 64.0, 53.0, 54.0, 37.0, 38.0, 21.0, 14.0, 19.0, 7.0, 10.0, 11.0, 9.0, 4.0, 3.0, 4.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.8298665285110474, -1.7795535326004028, -1.7292405366897583, -1.6789274215698242, -1.6286144256591797, -1.5783014297485352, -1.5279884338378906, -1.477675437927246, -1.4273624420166016, -1.377049446105957, -1.3267364501953125, -1.276423454284668, -1.2261103391647339, -1.1757973432540894, -1.1254843473434448, -1.0751713514328003, -1.0248582363128662, -0.9745452404022217, -0.9242321848869324, -0.8739191889762878, -0.8236061930656433, -0.773293137550354, -0.7229801416397095, -0.6726671457290649, -0.6223541498184204, -0.5720411539077759, -0.5217280983924866, -0.47141510248184204, -0.4211021065711975, -0.3707890808582306, -0.32047605514526367, -0.27016305923461914, -0.2198500633239746, -0.16953705251216888, -0.11922403424978256, -0.06891101598739624, -0.018598005175590515, 0.03171500563621521, 0.08202803134918213, 0.13234102725982666, 0.18265405297279358, 0.2329670637845993, 0.28328007459640503, 0.33359310030937195, 0.38390612602233887, 0.4342191219329834, 0.4845321476459503, 0.5348451137542725, 0.5851581692695618, 0.6354711651802063, 0.6857842206954956, 0.7360972166061401, 0.7864102125167847, 0.8367232084274292, 0.8870362639427185, 0.937349259853363, 0.9876623153686523, 1.0379753112792969, 1.0882883071899414, 1.138601303100586, 1.18891441822052, 1.2392274141311646, 1.289540410041809, 1.3398534059524536, 1.3901664018630981]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 7.0, 8.0, 4.0, 8.0, 21.0, 24.0, 51.0, 72.0, 140.0, 217.0, 420.0, 810.0, 1651.0, 3762.0, 9241.0, 27965.0, 216587.0, 711638.0, 51948.0, 13910.0, 5336.0, 2367.0, 1112.0, 579.0, 270.0, 159.0, 108.0, 49.0, 24.0, 26.0, 6.0, 9.0, 6.0, 3.0, 4.0, 4.0, 3.0, 0.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6884765625, -1.63604736328125, -1.5836181640625, -1.53118896484375, -1.478759765625, -1.42633056640625, -1.3739013671875, -1.32147216796875, -1.26904296875, -1.21661376953125, -1.1641845703125, -1.11175537109375, -1.059326171875, -1.00689697265625, -0.9544677734375, -0.90203857421875, -0.849609375, -0.79718017578125, -0.7447509765625, -0.69232177734375, -0.639892578125, -0.58746337890625, -0.5350341796875, -0.48260498046875, -0.43017578125, -0.37774658203125, -0.3253173828125, -0.27288818359375, -0.220458984375, -0.16802978515625, -0.1156005859375, -0.06317138671875, -0.0107421875, 0.04168701171875, 0.0941162109375, 0.14654541015625, 0.198974609375, 0.25140380859375, 0.3038330078125, 0.35626220703125, 0.40869140625, 0.46112060546875, 0.5135498046875, 0.56597900390625, 0.618408203125, 0.67083740234375, 0.7232666015625, 0.77569580078125, 0.828125, 0.88055419921875, 0.9329833984375, 0.98541259765625, 1.037841796875, 1.09027099609375, 1.1427001953125, 1.19512939453125, 1.24755859375, 1.29998779296875, 1.3524169921875, 1.40484619140625, 1.457275390625, 1.50970458984375, 1.5621337890625, 1.61456298828125, 1.6669921875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 5.0, 9.0, 19.0, 16.0, 18.0, 32.0, 31.0, 29.0, 50.0, 61.0, 50.0, 70.0, 66.0, 71.0, 70.0, 70.0, 68.0, 65.0, 43.0, 37.0, 29.0, 21.0, 13.0, 14.0, 8.0, 6.0, 10.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.671875, -2.5570068359375, -2.442138671875, -2.3272705078125, -2.21240234375, -2.0975341796875, -1.982666015625, -1.8677978515625, -1.7529296875, -1.6380615234375, -1.523193359375, -1.4083251953125, -1.29345703125, -1.1785888671875, -1.063720703125, -0.9488525390625, -0.833984375, -0.7191162109375, -0.604248046875, -0.4893798828125, -0.37451171875, -0.2596435546875, -0.144775390625, -0.0299072265625, 0.0849609375, 0.1998291015625, 0.314697265625, 0.4295654296875, 0.54443359375, 0.6593017578125, 0.774169921875, 0.8890380859375, 1.00390625, 1.1187744140625, 1.233642578125, 1.3485107421875, 1.46337890625, 1.5782470703125, 1.693115234375, 1.8079833984375, 1.9228515625, 2.0377197265625, 2.152587890625, 2.2674560546875, 2.38232421875, 2.4971923828125, 2.612060546875, 2.7269287109375, 2.841796875, 2.9566650390625, 3.071533203125, 3.1864013671875, 3.30126953125, 3.4161376953125, 3.531005859375, 3.6458740234375, 3.7607421875, 3.8756103515625, 3.990478515625, 4.1053466796875, 4.22021484375, 4.3350830078125, 4.449951171875, 4.5648193359375, 4.6796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 4.0, 12.0, 14.0, 5.0, 29.0, 29.0, 37.0, 40.0, 52.0, 51.0, 86.0, 201.0, 20870.0, 1026201.0, 488.0, 91.0, 63.0, 61.0, 49.0, 45.0, 33.0, 29.0, 17.0, 7.0, 16.0, 6.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2109375, -13.782470703125, -13.35400390625, -12.925537109375, -12.4970703125, -12.068603515625, -11.64013671875, -11.211669921875, -10.783203125, -10.354736328125, -9.92626953125, -9.497802734375, -9.0693359375, -8.640869140625, -8.21240234375, -7.783935546875, -7.35546875, -6.927001953125, -6.49853515625, -6.070068359375, -5.6416015625, -5.213134765625, -4.78466796875, -4.356201171875, -3.927734375, -3.499267578125, -3.07080078125, -2.642333984375, -2.2138671875, -1.785400390625, -1.35693359375, -0.928466796875, -0.5, -0.071533203125, 0.35693359375, 0.785400390625, 1.2138671875, 1.642333984375, 2.07080078125, 2.499267578125, 2.927734375, 3.356201171875, 3.78466796875, 4.213134765625, 4.6416015625, 5.070068359375, 5.49853515625, 5.927001953125, 6.35546875, 6.783935546875, 7.21240234375, 7.640869140625, 8.0693359375, 8.497802734375, 8.92626953125, 9.354736328125, 9.783203125, 10.211669921875, 10.64013671875, 11.068603515625, 11.4970703125, 11.925537109375, 12.35400390625, 12.782470703125, 13.2109375]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 5.0, 5.0, 7.0, 14.0, 11.0, 10.0, 27.0, 31.0, 35.0, 39.0, 54.0, 42.0, 59.0, 62.0, 82.0, 74.0, 69.0, 46.0, 55.0, 63.0, 43.0, 50.0, 35.0, 27.0, 20.0, 6.0, 15.0, 6.0, 5.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9609375, -4.81134033203125, -4.6617431640625, -4.51214599609375, -4.362548828125, -4.21295166015625, -4.0633544921875, -3.91375732421875, -3.76416015625, -3.61456298828125, -3.4649658203125, -3.31536865234375, -3.165771484375, -3.01617431640625, -2.8665771484375, -2.71697998046875, -2.5673828125, -2.41778564453125, -2.2681884765625, -2.11859130859375, -1.968994140625, -1.81939697265625, -1.6697998046875, -1.52020263671875, -1.37060546875, -1.22100830078125, -1.0714111328125, -0.92181396484375, -0.772216796875, -0.62261962890625, -0.4730224609375, -0.32342529296875, -0.173828125, -0.02423095703125, 0.1253662109375, 0.27496337890625, 0.424560546875, 0.57415771484375, 0.7237548828125, 0.87335205078125, 1.02294921875, 1.17254638671875, 1.3221435546875, 1.47174072265625, 1.621337890625, 1.77093505859375, 1.9205322265625, 2.07012939453125, 2.2197265625, 2.36932373046875, 2.5189208984375, 2.66851806640625, 2.818115234375, 2.96771240234375, 3.1173095703125, 3.26690673828125, 3.41650390625, 3.56610107421875, 3.7156982421875, 3.86529541015625, 4.014892578125, 4.16448974609375, 4.3140869140625, 4.46368408203125, 4.61328125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 5.0, 5.0, 9.0, 15.0, 16.0, 26.0, 26.0, 62.0, 110.0, 171.0, 366.0, 870.0, 2609.0, 10115.0, 68813.0, 899315.0, 53529.0, 8659.0, 2263.0, 773.0, 360.0, 141.0, 116.0, 71.0, 26.0, 18.0, 19.0, 8.0, 8.0, 6.0, 8.0, 6.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9013671875, -0.8772964477539062, -0.8532257080078125, -0.8291549682617188, -0.805084228515625, -0.7810134887695312, -0.7569427490234375, -0.7328720092773438, -0.70880126953125, -0.6847305297851562, -0.6606597900390625, -0.6365890502929688, -0.612518310546875, -0.5884475708007812, -0.5643768310546875, -0.5403060913085938, -0.5162353515625, -0.49216461181640625, -0.4680938720703125, -0.44402313232421875, -0.419952392578125, -0.39588165283203125, -0.3718109130859375, -0.34774017333984375, -0.32366943359375, -0.29959869384765625, -0.2755279541015625, -0.25145721435546875, -0.227386474609375, -0.20331573486328125, -0.1792449951171875, -0.15517425537109375, -0.131103515625, -0.10703277587890625, -0.0829620361328125, -0.05889129638671875, -0.034820556640625, -0.01074981689453125, 0.0133209228515625, 0.03739166259765625, 0.06146240234375, 0.08553314208984375, 0.1096038818359375, 0.13367462158203125, 0.157745361328125, 0.18181610107421875, 0.2058868408203125, 0.22995758056640625, 0.2540283203125, 0.27809906005859375, 0.3021697998046875, 0.32624053955078125, 0.350311279296875, 0.37438201904296875, 0.3984527587890625, 0.42252349853515625, 0.44659423828125, 0.47066497802734375, 0.4947357177734375, 0.5188064575195312, 0.542877197265625, 0.5669479370117188, 0.5910186767578125, 0.6150894165039062, 0.63916015625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 8.0, 14.0, 15.0, 20.0, 35.0, 121.0, 416.0, 205.0, 62.0, 39.0, 22.0, 10.0, 14.0, 8.0, 4.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00020003318786621094, -0.00019574910402297974, -0.00019146502017974854, -0.00018718093633651733, -0.00018289685249328613, -0.00017861276865005493, -0.00017432868480682373, -0.00017004460096359253, -0.00016576051712036133, -0.00016147643327713013, -0.00015719234943389893, -0.00015290826559066772, -0.00014862418174743652, -0.00014434009790420532, -0.00014005601406097412, -0.00013577193021774292, -0.00013148784637451172, -0.00012720376253128052, -0.00012291967868804932, -0.00011863559484481812, -0.00011435151100158691, -0.00011006742715835571, -0.00010578334331512451, -0.00010149925947189331, -9.721517562866211e-05, -9.293109178543091e-05, -8.864700794219971e-05, -8.43629240989685e-05, -8.00788402557373e-05, -7.57947564125061e-05, -7.15106725692749e-05, -6.72265887260437e-05, -6.29425048828125e-05, -5.86584210395813e-05, -5.43743371963501e-05, -5.0090253353118896e-05, -4.5806169509887695e-05, -4.1522085666656494e-05, -3.723800182342529e-05, -3.295391798019409e-05, -2.866983413696289e-05, -2.438575029373169e-05, -2.0101666450500488e-05, -1.5817582607269287e-05, -1.1533498764038086e-05, -7.249414920806885e-06, -2.9653310775756836e-06, 1.3187527656555176e-06, 5.602836608886719e-06, 9.88692045211792e-06, 1.4171004295349121e-05, 1.8455088138580322e-05, 2.2739171981811523e-05, 2.7023255825042725e-05, 3.1307339668273926e-05, 3.559142351150513e-05, 3.987550735473633e-05, 4.415959119796753e-05, 4.844367504119873e-05, 5.272775888442993e-05, 5.701184272766113e-05, 6.129592657089233e-05, 6.558001041412354e-05, 6.986409425735474e-05, 7.414817810058594e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 5.0, 3.0, 13.0, 23.0, 28.0, 44.0, 101.0, 137.0, 233.0, 504.0, 1032.0, 3040.0, 9958.0, 45592.0, 868516.0, 96423.0, 15639.0, 4366.0, 1556.0, 648.0, 305.0, 153.0, 82.0, 39.0, 32.0, 29.0, 17.0, 9.0, 10.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8193359375, -0.7969894409179688, -0.7746429443359375, -0.7522964477539062, -0.729949951171875, -0.7076034545898438, -0.6852569580078125, -0.6629104614257812, -0.64056396484375, -0.6182174682617188, -0.5958709716796875, -0.5735244750976562, -0.551177978515625, -0.5288314819335938, -0.5064849853515625, -0.48413848876953125, -0.4617919921875, -0.43944549560546875, -0.4170989990234375, -0.39475250244140625, -0.372406005859375, -0.35005950927734375, -0.3277130126953125, -0.30536651611328125, -0.28302001953125, -0.26067352294921875, -0.2383270263671875, -0.21598052978515625, -0.193634033203125, -0.17128753662109375, -0.1489410400390625, -0.12659454345703125, -0.104248046875, -0.08190155029296875, -0.0595550537109375, -0.03720855712890625, -0.014862060546875, 0.00748443603515625, 0.0298309326171875, 0.05217742919921875, 0.07452392578125, 0.09687042236328125, 0.1192169189453125, 0.14156341552734375, 0.163909912109375, 0.18625640869140625, 0.2086029052734375, 0.23094940185546875, 0.2532958984375, 0.27564239501953125, 0.2979888916015625, 0.32033538818359375, 0.342681884765625, 0.36502838134765625, 0.3873748779296875, 0.40972137451171875, 0.43206787109375, 0.45441436767578125, 0.4767608642578125, 0.49910736083984375, 0.521453857421875, 0.5438003540039062, 0.5661468505859375, 0.5884933471679688, 0.61083984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 3.0, 5.0, 3.0, 6.0, 2.0, 5.0, 11.0, 8.0, 19.0, 34.0, 43.0, 57.0, 139.0, 387.0, 93.0, 48.0, 49.0, 17.0, 17.0, 11.0, 10.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.229248046875, -0.22168350219726562, -0.21411895751953125, -0.20655441284179688, -0.1989898681640625, -0.19142532348632812, -0.18386077880859375, -0.17629623413085938, -0.168731689453125, -0.16116714477539062, -0.15360260009765625, -0.14603805541992188, -0.1384735107421875, -0.13090896606445312, -0.12334442138671875, -0.11577987670898438, -0.10821533203125, -0.10065078735351562, -0.09308624267578125, -0.08552169799804688, -0.0779571533203125, -0.07039260864257812, -0.06282806396484375, -0.055263519287109375, -0.047698974609375, -0.040134429931640625, -0.03256988525390625, -0.025005340576171875, -0.0174407958984375, -0.009876251220703125, -0.00231170654296875, 0.005252838134765625, 0.0128173828125, 0.020381927490234375, 0.02794647216796875, 0.035511016845703125, 0.0430755615234375, 0.050640106201171875, 0.05820465087890625, 0.06576919555664062, 0.073333740234375, 0.08089828491210938, 0.08846282958984375, 0.09602737426757812, 0.1035919189453125, 0.11115646362304688, 0.11872100830078125, 0.12628555297851562, 0.13385009765625, 0.14141464233398438, 0.14897918701171875, 0.15654373168945312, 0.1641082763671875, 0.17167282104492188, 0.17923736572265625, 0.18680191040039062, 0.194366455078125, 0.20193099975585938, 0.20949554443359375, 0.21706008911132812, 0.2246246337890625, 0.23218917846679688, 0.23975372314453125, 0.24731826782226562, 0.2548828125]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 6.0, 5.0, 6.0, 6.0, 16.0, 24.0, 27.0, 57.0, 64.0, 98.0, 113.0, 135.0, 148.0, 100.0, 72.0, 32.0, 21.0, 27.0, 10.0, 5.0, 10.0, 9.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.2398436069488525, -3.094416379928589, -2.948989152908325, -2.8035619258880615, -2.658134698867798, -2.512707471847534, -2.3672802448272705, -2.221853017807007, -2.076425790786743, -1.9309985637664795, -1.7855713367462158, -1.6401441097259521, -1.4947168827056885, -1.3492896556854248, -1.2038624286651611, -1.0584352016448975, -0.9130079746246338, -0.7675807476043701, -0.6221535205841064, -0.4767262935638428, -0.3312990665435791, -0.18587183952331543, -0.04044461250305176, 0.10498261451721191, 0.2504098415374756, 0.39583706855773926, 0.5412642955780029, 0.6866915225982666, 0.8321187496185303, 0.977545976638794, 1.1229732036590576, 1.2684004306793213, 1.4138274192810059, 1.5592546463012695, 1.7046818733215332, 1.8501091003417969, 1.9955363273620605, 2.140963554382324, 2.286390781402588, 2.4318180084228516, 2.5772452354431152, 2.722672462463379, 2.8680996894836426, 3.0135269165039062, 3.15895414352417, 3.3043813705444336, 3.4498085975646973, 3.595235824584961, 3.7406630516052246, 3.8860902786254883, 4.031517505645752, 4.176944732666016, 4.322371959686279, 4.467799186706543, 4.613226413726807, 4.75865364074707, 4.904080867767334, 5.049508094787598, 5.194935321807861, 5.340362548828125, 5.485789775848389, 5.631217002868652, 5.776644229888916, 5.92207145690918, 6.067498683929443]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 9.0, 3.0, 3.0, 11.0, 11.0, 13.0, 22.0, 19.0, 20.0, 22.0, 41.0, 38.0, 35.0, 34.0, 37.0, 41.0, 37.0, 44.0, 44.0, 40.0, 49.0, 41.0, 37.0, 46.0, 32.0, 38.0, 27.0, 26.0, 32.0, 27.0, 21.0, 26.0, 17.0, 14.0, 7.0, 8.0, 7.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.073009967803955, -4.921655654907227, -4.770301818847656, -4.618947505950928, -4.467593193054199, -4.316238880157471, -4.164884567260742, -4.013530731201172, -3.8621764183044434, -3.710822105407715, -3.5594680309295654, -3.408113956451416, -3.2567596435546875, -3.105405330657959, -2.9540512561798096, -2.80269718170166, -2.6513428688049316, -2.499988555908203, -2.3486344814300537, -2.1972804069519043, -2.045926094055176, -1.8945719003677368, -1.7432177066802979, -1.5918635129928589, -1.44050931930542, -1.289155125617981, -1.137800931930542, -0.986446738243103, -0.8350925445556641, -0.6837383508682251, -0.5323841571807861, -0.38102996349334717, -0.22967529296875, -0.07832109928131104, 0.07303309440612793, 0.2243872880935669, 0.37574148178100586, 0.5270956754684448, 0.6784498691558838, 0.8298040628433228, 0.9811582565307617, 1.1325124502182007, 1.2838666439056396, 1.4352208375930786, 1.5865750312805176, 1.7379292249679565, 1.8892834186553955, 2.040637493133545, 2.1919918060302734, 2.343346118927002, 2.4947001934051514, 2.646054267883301, 2.7974085807800293, 2.948762893676758, 3.1001169681549072, 3.2514710426330566, 3.402825355529785, 3.5541796684265137, 3.705533742904663, 3.8568878173828125, 4.008242130279541, 4.1595964431762695, 4.31095027923584, 4.462304592132568, 4.613658905029297]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 3.0, 8.0, 8.0, 13.0, 10.0, 14.0, 16.0, 21.0, 34.0, 40.0, 63.0, 76.0, 118.0, 244.0, 502.0, 1274.0, 3815.0, 13946.0, 76051.0, 1434287.0, 2543290.0, 96249.0, 16753.0, 4514.0, 1557.0, 642.0, 272.0, 146.0, 91.0, 57.0, 39.0, 26.0, 22.0, 16.0, 15.0, 12.0, 8.0, 12.0, 7.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.427734375, -3.317352294921875, -3.20697021484375, -3.096588134765625, -2.9862060546875, -2.875823974609375, -2.76544189453125, -2.655059814453125, -2.544677734375, -2.434295654296875, -2.32391357421875, -2.213531494140625, -2.1031494140625, -1.992767333984375, -1.88238525390625, -1.772003173828125, -1.66162109375, -1.551239013671875, -1.44085693359375, -1.330474853515625, -1.2200927734375, -1.109710693359375, -0.99932861328125, -0.888946533203125, -0.778564453125, -0.668182373046875, -0.55780029296875, -0.447418212890625, -0.3370361328125, -0.226654052734375, -0.11627197265625, -0.005889892578125, 0.1044921875, 0.214874267578125, 0.32525634765625, 0.435638427734375, 0.5460205078125, 0.656402587890625, 0.76678466796875, 0.877166748046875, 0.987548828125, 1.097930908203125, 1.20831298828125, 1.318695068359375, 1.4290771484375, 1.539459228515625, 1.64984130859375, 1.760223388671875, 1.87060546875, 1.980987548828125, 2.09136962890625, 2.201751708984375, 2.3121337890625, 2.422515869140625, 2.53289794921875, 2.643280029296875, 2.753662109375, 2.864044189453125, 2.97442626953125, 3.084808349609375, 3.1951904296875, 3.305572509765625, 3.41595458984375, 3.526336669921875, 3.63671875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 10.0, 8.0, 14.0, 20.0, 21.0, 18.0, 25.0, 34.0, 51.0, 51.0, 73.0, 73.0, 95.0, 91.0, 71.0, 81.0, 53.0, 46.0, 31.0, 28.0, 24.0, 15.0, 19.0, 15.0, 10.0, 9.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.58984375, -2.5214080810546875, -2.452972412109375, -2.3845367431640625, -2.31610107421875, -2.2476654052734375, -2.179229736328125, -2.1107940673828125, -2.0423583984375, -1.9739227294921875, -1.905487060546875, -1.8370513916015625, -1.76861572265625, -1.7001800537109375, -1.631744384765625, -1.5633087158203125, -1.494873046875, -1.4264373779296875, -1.358001708984375, -1.2895660400390625, -1.22113037109375, -1.1526947021484375, -1.084259033203125, -1.0158233642578125, -0.9473876953125, -0.8789520263671875, -0.810516357421875, -0.7420806884765625, -0.67364501953125, -0.6052093505859375, -0.536773681640625, -0.4683380126953125, -0.39990234375, -0.3314666748046875, -0.263031005859375, -0.1945953369140625, -0.12615966796875, -0.0577239990234375, 0.010711669921875, 0.0791473388671875, 0.1475830078125, 0.2160186767578125, 0.284454345703125, 0.3528900146484375, 0.42132568359375, 0.4897613525390625, 0.558197021484375, 0.6266326904296875, 0.695068359375, 0.7635040283203125, 0.831939697265625, 0.9003753662109375, 0.96881103515625, 1.0372467041015625, 1.105682373046875, 1.1741180419921875, 1.2425537109375, 1.3109893798828125, 1.379425048828125, 1.4478607177734375, 1.51629638671875, 1.5847320556640625, 1.653167724609375, 1.7216033935546875, 1.7900390625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 10.0, 54.0, 323.0, 539411.0, 3654078.0, 358.0, 43.0, 8.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -16.660888671875, -15.86865234375, -15.076416015625, -14.2841796875, -13.491943359375, -12.69970703125, -11.907470703125, -11.115234375, -10.322998046875, -9.53076171875, -8.738525390625, -7.9462890625, -7.154052734375, -6.36181640625, -5.569580078125, -4.77734375, -3.985107421875, -3.19287109375, -2.400634765625, -1.6083984375, -0.816162109375, -0.02392578125, 0.768310546875, 1.560546875, 2.352783203125, 3.14501953125, 3.937255859375, 4.7294921875, 5.521728515625, 6.31396484375, 7.106201171875, 7.8984375, 8.690673828125, 9.48291015625, 10.275146484375, 11.0673828125, 11.859619140625, 12.65185546875, 13.444091796875, 14.236328125, 15.028564453125, 15.82080078125, 16.613037109375, 17.4052734375, 18.197509765625, 18.98974609375, 19.781982421875, 20.57421875, 21.366455078125, 22.15869140625, 22.950927734375, 23.7431640625, 24.535400390625, 25.32763671875, 26.119873046875, 26.912109375, 27.704345703125, 28.49658203125, 29.288818359375, 30.0810546875, 30.873291015625, 31.66552734375, 32.457763671875, 33.25]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 7.0, 13.0, 5.0, 15.0, 14.0, 17.0, 16.0, 21.0, 48.0, 53.0, 63.0, 86.0, 177.0, 222.0, 425.0, 886.0, 828.0, 386.0, 260.0, 146.0, 120.0, 77.0, 57.0, 25.0, 33.0, 17.0, 18.0, 9.0, 8.0, 4.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.67041015625, -0.6506805419921875, -0.630950927734375, -0.6112213134765625, -0.59149169921875, -0.5717620849609375, -0.552032470703125, -0.5323028564453125, -0.5125732421875, -0.4928436279296875, -0.473114013671875, -0.4533843994140625, -0.43365478515625, -0.4139251708984375, -0.394195556640625, -0.3744659423828125, -0.354736328125, -0.3350067138671875, -0.315277099609375, -0.2955474853515625, -0.27581787109375, -0.2560882568359375, -0.236358642578125, -0.2166290283203125, -0.1968994140625, -0.1771697998046875, -0.157440185546875, -0.1377105712890625, -0.11798095703125, -0.0982513427734375, -0.078521728515625, -0.0587921142578125, -0.0390625, -0.0193328857421875, 0.000396728515625, 0.0201263427734375, 0.03985595703125, 0.0595855712890625, 0.079315185546875, 0.0990447998046875, 0.1187744140625, 0.1385040283203125, 0.158233642578125, 0.1779632568359375, 0.19769287109375, 0.2174224853515625, 0.237152099609375, 0.2568817138671875, 0.276611328125, 0.2963409423828125, 0.316070556640625, 0.3358001708984375, 0.35552978515625, 0.3752593994140625, 0.394989013671875, 0.4147186279296875, 0.4344482421875, 0.4541778564453125, 0.473907470703125, 0.4936370849609375, 0.51336669921875, 0.5330963134765625, 0.552825927734375, 0.5725555419921875, 0.59228515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 3.0, 8.0, 8.0, 11.0, 21.0, 26.0, 49.0, 83.0, 121.0, 172.0, 180.0, 117.0, 84.0, 45.0, 18.0, 17.0, 10.0, 9.0, 8.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.522580146789551, -3.3866825103759766, -3.2507848739624023, -3.114887237548828, -2.978989601135254, -2.8430919647216797, -2.7071945667266846, -2.5712969303131104, -2.435399293899536, -2.299501657485962, -2.1636040210723877, -2.0277063846588135, -1.8918088674545288, -1.7559112310409546, -1.62001371383667, -1.4841160774230957, -1.3482184410095215, -1.2123208045959473, -1.076423168182373, -0.9405256509780884, -0.8046280145645142, -0.6687303781509399, -0.5328328013420105, -0.39693522453308105, -0.26103758811950684, -0.125139981508255, 0.010757625102996826, 0.14665523171424866, 0.2825528383255005, 0.4184504747390747, 0.5543480515480042, 0.6902456283569336, 0.8261427879333496, 0.9620404243469238, 1.097938060760498, 1.2338355779647827, 1.369733214378357, 1.5056308507919312, 1.6415283679962158, 1.77742600440979, 1.9133236408233643, 2.0492212772369385, 2.1851189136505127, 2.321016550064087, 2.456913948059082, 2.5928115844726562, 2.7287092208862305, 2.8646068572998047, 3.000504493713379, 3.136402130126953, 3.2722997665405273, 3.4081974029541016, 3.544095039367676, 3.67999267578125, 3.815890073776245, 3.9517877101898193, 4.087685585021973, 4.223583221435547, 4.359480857849121, 4.495378494262695, 4.6312761306762695, 4.767173767089844, 4.903071403503418, 5.038969039916992, 5.174866199493408]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 5.0, 8.0, 17.0, 5.0, 15.0, 14.0, 23.0, 26.0, 25.0, 37.0, 41.0, 40.0, 62.0, 70.0, 61.0, 67.0, 58.0, 61.0, 61.0, 57.0, 48.0, 45.0, 32.0, 33.0, 22.0, 22.0, 15.0, 6.0, 6.0, 9.0, 3.0, 3.0, 1.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2260286808013916, -2.1580471992492676, -2.0900659561157227, -2.0220844745635986, -1.9541029930114746, -1.8861216306686401, -1.8181402683258057, -1.7501587867736816, -1.6821773052215576, -1.6141959428787231, -1.5462144613265991, -1.4782330989837646, -1.4102516174316406, -1.3422702550888062, -1.2742888927459717, -1.2063074111938477, -1.1383260488510132, -1.0703446865081787, -1.0023632049560547, -0.9343818426132202, -0.8664003610610962, -0.7984189987182617, -0.7304375767707825, -0.6624561548233032, -0.594474732875824, -0.5264933109283447, -0.4585118889808655, -0.3905304968357086, -0.32254907488822937, -0.2545676529407501, -0.18658626079559326, -0.11860483884811401, -0.050623416900634766, 0.017357997596263885, 0.08533941209316254, 0.1533208191394806, 0.22130224108695984, 0.2892836630344391, 0.35726505517959595, 0.4252464771270752, 0.49322789907455444, 0.5612093210220337, 0.6291907429695129, 0.6971721649169922, 0.7651535272598267, 0.8331350088119507, 0.9011163711547852, 0.9690977931022644, 1.0370792150497437, 1.1050605773925781, 1.1730420589447021, 1.2410234212875366, 1.3090049028396606, 1.3769862651824951, 1.4449677467346191, 1.5129491090774536, 1.580930471420288, 1.6489118337631226, 1.7168933153152466, 1.784874677658081, 1.852856159210205, 1.9208375215530396, 1.988818883895874, 2.056800365447998, 2.124781847000122]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 2.0, 12.0, 17.0, 13.0, 34.0, 39.0, 50.0, 101.0, 222.0, 366.0, 698.0, 1708.0, 4960.0, 46410.0, 933310.0, 51841.0, 5399.0, 1736.0, 750.0, 356.0, 198.0, 120.0, 73.0, 34.0, 25.0, 19.0, 20.0, 8.0, 14.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6337890625, -0.6159439086914062, -0.5980987548828125, -0.5802536010742188, -0.562408447265625, -0.5445632934570312, -0.5267181396484375, -0.5088729858398438, -0.49102783203125, -0.47318267822265625, -0.4553375244140625, -0.43749237060546875, -0.419647216796875, -0.40180206298828125, -0.3839569091796875, -0.36611175537109375, -0.3482666015625, -0.33042144775390625, -0.3125762939453125, -0.29473114013671875, -0.276885986328125, -0.25904083251953125, -0.2411956787109375, -0.22335052490234375, -0.20550537109375, -0.18766021728515625, -0.1698150634765625, -0.15196990966796875, -0.134124755859375, -0.11627960205078125, -0.0984344482421875, -0.08058929443359375, -0.062744140625, -0.04489898681640625, -0.0270538330078125, -0.00920867919921875, 0.008636474609375, 0.02648162841796875, 0.0443267822265625, 0.06217193603515625, 0.08001708984375, 0.09786224365234375, 0.1157073974609375, 0.13355255126953125, 0.151397705078125, 0.16924285888671875, 0.1870880126953125, 0.20493316650390625, 0.2227783203125, 0.24062347412109375, 0.2584686279296875, 0.27631378173828125, 0.294158935546875, 0.31200408935546875, 0.3298492431640625, 0.34769439697265625, 0.36553955078125, 0.38338470458984375, 0.4012298583984375, 0.41907501220703125, 0.436920166015625, 0.45476531982421875, 0.4726104736328125, 0.49045562744140625, 0.50830078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 5.0, 7.0, 4.0, 12.0, 13.0, 13.0, 15.0, 24.0, 34.0, 30.0, 41.0, 51.0, 64.0, 77.0, 70.0, 76.0, 67.0, 79.0, 51.0, 62.0, 45.0, 46.0, 28.0, 23.0, 13.0, 16.0, 13.0, 10.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3974609375, -1.348724365234375, -1.29998779296875, -1.251251220703125, -1.2025146484375, -1.153778076171875, -1.10504150390625, -1.056304931640625, -1.007568359375, -0.958831787109375, -0.91009521484375, -0.861358642578125, -0.8126220703125, -0.763885498046875, -0.71514892578125, -0.666412353515625, -0.61767578125, -0.568939208984375, -0.52020263671875, -0.471466064453125, -0.4227294921875, -0.373992919921875, -0.32525634765625, -0.276519775390625, -0.227783203125, -0.179046630859375, -0.13031005859375, -0.081573486328125, -0.0328369140625, 0.015899658203125, 0.06463623046875, 0.113372802734375, 0.162109375, 0.210845947265625, 0.25958251953125, 0.308319091796875, 0.3570556640625, 0.405792236328125, 0.45452880859375, 0.503265380859375, 0.552001953125, 0.600738525390625, 0.64947509765625, 0.698211669921875, 0.7469482421875, 0.795684814453125, 0.84442138671875, 0.893157958984375, 0.94189453125, 0.990631103515625, 1.03936767578125, 1.088104248046875, 1.1368408203125, 1.185577392578125, 1.23431396484375, 1.283050537109375, 1.331787109375, 1.380523681640625, 1.42926025390625, 1.477996826171875, 1.5267333984375, 1.575469970703125, 1.62420654296875, 1.672943115234375, 1.7216796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 10.0, 5.0, 4.0, 6.0, 7.0, 10.0, 12.0, 23.0, 31.0, 32.0, 37.0, 59.0, 92.0, 121.0, 156.0, 234.0, 324.0, 625.0, 1788.0, 8135.0, 65856.0, 697161.0, 246903.0, 20893.0, 3641.0, 1018.0, 421.0, 238.0, 176.0, 140.0, 90.0, 76.0, 56.0, 36.0, 25.0, 30.0, 21.0, 22.0, 11.0, 5.0, 10.0, 5.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.186767578125, -0.18106460571289062, -0.17536163330078125, -0.16965866088867188, -0.1639556884765625, -0.15825271606445312, -0.15254974365234375, -0.14684677124023438, -0.141143798828125, -0.13544082641601562, -0.12973785400390625, -0.12403488159179688, -0.1183319091796875, -0.11262893676757812, -0.10692596435546875, -0.10122299194335938, -0.09552001953125, -0.08981704711914062, -0.08411407470703125, -0.07841110229492188, -0.0727081298828125, -0.06700515747070312, -0.06130218505859375, -0.055599212646484375, -0.049896240234375, -0.044193267822265625, -0.03849029541015625, -0.032787322998046875, -0.0270843505859375, -0.021381378173828125, -0.01567840576171875, -0.009975433349609375, -0.0042724609375, 0.001430511474609375, 0.00713348388671875, 0.012836456298828125, 0.0185394287109375, 0.024242401123046875, 0.02994537353515625, 0.035648345947265625, 0.041351318359375, 0.047054290771484375, 0.05275726318359375, 0.058460235595703125, 0.0641632080078125, 0.06986618041992188, 0.07556915283203125, 0.08127212524414062, 0.08697509765625, 0.09267807006835938, 0.09838104248046875, 0.10408401489257812, 0.1097869873046875, 0.11548995971679688, 0.12119293212890625, 0.12689590454101562, 0.132598876953125, 0.13830184936523438, 0.14400482177734375, 0.14970779418945312, 0.1554107666015625, 0.16111373901367188, 0.16681671142578125, 0.17251968383789062, 0.17822265625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 6.0, 5.0, 5.0, 4.0, 7.0, 8.0, 9.0, 14.0, 17.0, 13.0, 26.0, 23.0, 33.0, 30.0, 38.0, 33.0, 33.0, 51.0, 52.0, 43.0, 37.0, 56.0, 50.0, 51.0, 46.0, 46.0, 33.0, 32.0, 34.0, 25.0, 20.0, 25.0, 12.0, 7.0, 19.0, 12.0, 6.0, 4.0, 6.0, 9.0, 5.0, 2.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.7373046875, -1.6831512451171875, -1.628997802734375, -1.5748443603515625, -1.52069091796875, -1.4665374755859375, -1.412384033203125, -1.3582305908203125, -1.3040771484375, -1.2499237060546875, -1.195770263671875, -1.1416168212890625, -1.08746337890625, -1.0333099365234375, -0.979156494140625, -0.9250030517578125, -0.870849609375, -0.8166961669921875, -0.762542724609375, -0.7083892822265625, -0.65423583984375, -0.6000823974609375, -0.545928955078125, -0.4917755126953125, -0.4376220703125, -0.3834686279296875, -0.329315185546875, -0.2751617431640625, -0.22100830078125, -0.1668548583984375, -0.112701416015625, -0.0585479736328125, -0.00439453125, 0.0497589111328125, 0.103912353515625, 0.1580657958984375, 0.21221923828125, 0.2663726806640625, 0.320526123046875, 0.3746795654296875, 0.4288330078125, 0.4829864501953125, 0.537139892578125, 0.5912933349609375, 0.64544677734375, 0.6996002197265625, 0.753753662109375, 0.8079071044921875, 0.862060546875, 0.9162139892578125, 0.970367431640625, 1.0245208740234375, 1.07867431640625, 1.1328277587890625, 1.186981201171875, 1.2411346435546875, 1.2952880859375, 1.3494415283203125, 1.403594970703125, 1.4577484130859375, 1.51190185546875, 1.5660552978515625, 1.620208740234375, 1.6743621826171875, 1.728515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 2.0, 8.0, 12.0, 12.0, 14.0, 22.0, 39.0, 61.0, 74.0, 143.0, 252.0, 500.0, 1066.0, 3315.0, 24582.0, 908590.0, 101097.0, 5840.0, 1489.0, 608.0, 299.0, 200.0, 112.0, 58.0, 45.0, 28.0, 17.0, 12.0, 13.0, 9.0, 10.0, 5.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047271728515625, -0.0456242561340332, -0.043976783752441406, -0.04232931137084961, -0.04068183898925781, -0.039034366607666016, -0.03738689422607422, -0.03573942184448242, -0.034091949462890625, -0.03244447708129883, -0.03079700469970703, -0.029149532318115234, -0.027502059936523438, -0.02585458755493164, -0.024207115173339844, -0.022559642791748047, -0.02091217041015625, -0.019264698028564453, -0.017617225646972656, -0.01596975326538086, -0.014322280883789062, -0.012674808502197266, -0.011027336120605469, -0.009379863739013672, -0.007732391357421875, -0.006084918975830078, -0.004437446594238281, -0.0027899742126464844, -0.0011425018310546875, 0.0005049705505371094, 0.0021524429321289062, 0.003799915313720703, 0.0054473876953125, 0.007094860076904297, 0.008742332458496094, 0.01038980484008789, 0.012037277221679688, 0.013684749603271484, 0.015332221984863281, 0.016979694366455078, 0.018627166748046875, 0.020274639129638672, 0.02192211151123047, 0.023569583892822266, 0.025217056274414062, 0.02686452865600586, 0.028512001037597656, 0.030159473419189453, 0.03180694580078125, 0.03345441818237305, 0.035101890563964844, 0.03674936294555664, 0.03839683532714844, 0.040044307708740234, 0.04169178009033203, 0.04333925247192383, 0.044986724853515625, 0.04663419723510742, 0.04828166961669922, 0.049929141998291016, 0.05157661437988281, 0.05322408676147461, 0.054871559143066406, 0.0565190315246582, 0.05816650390625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 7.0, 2.0, 6.0, 11.0, 9.0, 13.0, 24.0, 39.0, 60.0, 62.0, 74.0, 91.0, 100.0, 101.0, 88.0, 70.0, 45.0, 47.0, 42.0, 24.0, 19.0, 13.0, 13.0, 11.0, 4.0, 4.0, 6.0, 3.0, 1.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5139579772949219e-05, -1.4559365808963776e-05, -1.3979151844978333e-05, -1.339893788099289e-05, -1.2818723917007446e-05, -1.2238509953022003e-05, -1.165829598903656e-05, -1.1078082025051117e-05, -1.0497868061065674e-05, -9.91765409708023e-06, -9.337440133094788e-06, -8.757226169109344e-06, -8.177012205123901e-06, -7.596798241138458e-06, -7.016584277153015e-06, -6.436370313167572e-06, -5.856156349182129e-06, -5.275942385196686e-06, -4.695728421211243e-06, -4.1155144572257996e-06, -3.5353004932403564e-06, -2.9550865292549133e-06, -2.3748725652694702e-06, -1.794658601284027e-06, -1.214444637298584e-06, -6.342306733131409e-07, -5.4016709327697754e-08, 5.261972546577454e-07, 1.1064112186431885e-06, 1.6866251826286316e-06, 2.2668391466140747e-06, 2.847053110599518e-06, 3.427267074584961e-06, 4.007481038570404e-06, 4.587695002555847e-06, 5.16790896654129e-06, 5.748122930526733e-06, 6.3283368945121765e-06, 6.90855085849762e-06, 7.488764822483063e-06, 8.068978786468506e-06, 8.649192750453949e-06, 9.229406714439392e-06, 9.809620678424835e-06, 1.0389834642410278e-05, 1.0970048606395721e-05, 1.1550262570381165e-05, 1.2130476534366608e-05, 1.271069049835205e-05, 1.3290904462337494e-05, 1.3871118426322937e-05, 1.445133239030838e-05, 1.5031546354293823e-05, 1.5611760318279266e-05, 1.619197428226471e-05, 1.6772188246250153e-05, 1.7352402210235596e-05, 1.793261617422104e-05, 1.8512830138206482e-05, 1.9093044102191925e-05, 1.9673258066177368e-05, 2.025347203016281e-05, 2.0833685994148254e-05, 2.1413899958133698e-05, 2.199411392211914e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 2.0, 5.0, 7.0, 20.0, 17.0, 30.0, 19.0, 42.0, 55.0, 132.0, 162.0, 305.0, 569.0, 1133.0, 2623.0, 7785.0, 35399.0, 604610.0, 356657.0, 27501.0, 6892.0, 2333.0, 1035.0, 539.0, 268.0, 130.0, 82.0, 54.0, 46.0, 29.0, 21.0, 11.0, 5.0, 9.0, 2.0, 4.0, 3.0, 2.0, 5.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.048675537109375, -0.04719734191894531, -0.045719146728515625, -0.04424095153808594, -0.04276275634765625, -0.04128456115722656, -0.039806365966796875, -0.03832817077636719, -0.0368499755859375, -0.03537178039550781, -0.033893585205078125, -0.03241539001464844, -0.03093719482421875, -0.029458999633789062, -0.027980804443359375, -0.026502609252929688, -0.0250244140625, -0.023546218872070312, -0.022068023681640625, -0.020589828491210938, -0.01911163330078125, -0.017633438110351562, -0.016155242919921875, -0.014677047729492188, -0.0131988525390625, -0.011720657348632812, -0.010242462158203125, -0.008764266967773438, -0.00728607177734375, -0.0058078765869140625, -0.004329681396484375, -0.0028514862060546875, -0.001373291015625, 0.0001049041748046875, 0.001583099365234375, 0.0030612945556640625, 0.00453948974609375, 0.0060176849365234375, 0.007495880126953125, 0.008974075317382812, 0.0104522705078125, 0.011930465698242188, 0.013408660888671875, 0.014886856079101562, 0.01636505126953125, 0.017843246459960938, 0.019321441650390625, 0.020799636840820312, 0.02227783203125, 0.023756027221679688, 0.025234222412109375, 0.026712417602539062, 0.02819061279296875, 0.029668807983398438, 0.031147003173828125, 0.03262519836425781, 0.0341033935546875, 0.03558158874511719, 0.037059783935546875, 0.03853797912597656, 0.04001617431640625, 0.04149436950683594, 0.042972564697265625, 0.04445075988769531, 0.045928955078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 9.0, 3.0, 3.0, 3.0, 7.0, 10.0, 14.0, 8.0, 27.0, 30.0, 25.0, 50.0, 54.0, 96.0, 99.0, 118.0, 122.0, 77.0, 61.0, 55.0, 33.0, 18.0, 19.0, 15.0, 9.0, 10.0, 6.0, 1.0, 8.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005458831787109375, -0.005296289920806885, -0.0051337480545043945, -0.004971206188201904, -0.004808664321899414, -0.004646122455596924, -0.004483580589294434, -0.004321038722991943, -0.004158496856689453, -0.003995954990386963, -0.0038334131240844727, -0.0036708712577819824, -0.003508329391479492, -0.003345787525177002, -0.0031832456588745117, -0.0030207037925720215, -0.0028581619262695312, -0.002695620059967041, -0.0025330781936645508, -0.0023705363273620605, -0.0022079944610595703, -0.00204545259475708, -0.0018829107284545898, -0.0017203688621520996, -0.0015578269958496094, -0.0013952851295471191, -0.001232743263244629, -0.0010702013969421387, -0.0009076595306396484, -0.0007451176643371582, -0.000582575798034668, -0.00042003393173217773, -0.0002574920654296875, -9.495019912719727e-05, 6.759166717529297e-05, 0.0002301335334777832, 0.00039267539978027344, 0.0005552172660827637, 0.0007177591323852539, 0.0008803009986877441, 0.0010428428649902344, 0.0012053847312927246, 0.0013679265975952148, 0.001530468463897705, 0.0016930103302001953, 0.0018555521965026855, 0.0020180940628051758, 0.002180635929107666, 0.0023431777954101562, 0.0025057196617126465, 0.0026682615280151367, 0.002830803394317627, 0.002993345260620117, 0.0031558871269226074, 0.0033184289932250977, 0.003480970859527588, 0.003643512725830078, 0.0038060545921325684, 0.003968596458435059, 0.004131138324737549, 0.004293680191040039, 0.004456222057342529, 0.0046187639236450195, 0.00478130578994751, 0.00494384765625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 7.0, 6.0, 6.0, 11.0, 24.0, 29.0, 55.0, 93.0, 159.0, 210.0, 163.0, 109.0, 47.0, 28.0, 15.0, 8.0, 12.0, 12.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.2944765090942383, -2.2006967067718506, -2.106916904449463, -2.013137102127075, -1.919357419013977, -1.8255776166915894, -1.7317979335784912, -1.6380181312561035, -1.5442383289337158, -1.4504585266113281, -1.3566787242889404, -1.2628990411758423, -1.1691192388534546, -1.075339436531067, -0.981559693813324, -0.887779951095581, -0.7940001487731934, -0.7002203464508057, -0.6064406037330627, -0.5126608610153198, -0.41888105869293213, -0.3251012861728668, -0.2313215136528015, -0.1375417709350586, -0.0437619686126709, 0.05001780390739441, 0.14379757642745972, 0.23757734894752502, 0.33135712146759033, 0.42513689398765564, 0.518916666507721, 0.6126964092254639, 0.7064764499664307, 0.8002562522888184, 0.8940359950065613, 0.9878157377243042, 1.081595540046692, 1.1753753423690796, 1.2691550254821777, 1.3629348278045654, 1.4567146301269531, 1.5504944324493408, 1.6442742347717285, 1.7380539178848267, 1.8318337202072144, 1.925613522529602, 2.0193932056427, 2.113173007965088, 2.2069528102874756, 2.3007326126098633, 2.394512414932251, 2.4882922172546387, 2.5820717811584473, 2.675851583480835, 2.7696313858032227, 2.8634111881256104, 2.957190990447998, 3.0509707927703857, 3.1447505950927734, 3.238530397415161, 3.332310199737549, 3.4260897636413574, 3.519869565963745, 3.613649368286133, 3.7074291706085205]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 10.0, 14.0, 9.0, 18.0, 27.0, 28.0, 30.0, 44.0, 50.0, 82.0, 82.0, 85.0, 78.0, 78.0, 76.0, 57.0, 60.0, 40.0, 35.0, 24.0, 21.0, 13.0, 7.0, 6.0, 9.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.8428611755371094, -1.7918403148651123, -1.7408194541931152, -1.6897985935211182, -1.6387776136398315, -1.5877567529678345, -1.5367358922958374, -1.4857150316238403, -1.4346940517425537, -1.3836731910705566, -1.3326523303985596, -1.2816314697265625, -1.2306104898452759, -1.1795896291732788, -1.1285687685012817, -1.0775479078292847, -1.0265270471572876, -0.9755061864852905, -0.9244852662086487, -0.8734644055366516, -0.8224434852600098, -0.7714226245880127, -0.7204017639160156, -0.6693809032440186, -0.6183599829673767, -0.5673391222953796, -0.5163182020187378, -0.4652973413467407, -0.41427645087242126, -0.3632555603981018, -0.31223469972610474, -0.2612138092517853, -0.21019303798675537, -0.1591721475124359, -0.10815127193927765, -0.057130396366119385, -0.006109505891799927, 0.04491138458251953, 0.0959322452545166, 0.14695313572883606, 0.19797402620315552, 0.24899491667747498, 0.30001580715179443, 0.3510366678237915, 0.40205755829811096, 0.4530784487724304, 0.5040993094444275, 0.5551202297210693, 0.6061410903930664, 0.6571619510650635, 0.7081828713417053, 0.7592037320137024, 0.8102246522903442, 0.8612455129623413, 0.9122663736343384, 0.9632872343063354, 1.014308214187622, 1.0653290748596191, 1.1163499355316162, 1.1673707962036133, 1.2183917760849, 1.269412636756897, 1.320433497428894, 1.3714543581008911, 1.4224752187728882]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 4.0, 9.0, 8.0, 13.0, 15.0, 16.0, 45.0, 58.0, 88.0, 173.0, 242.0, 444.0, 719.0, 1572.0, 3322.0, 7580.0, 21612.0, 79424.0, 679198.0, 194911.0, 37467.0, 12080.0, 4760.0, 2235.0, 1123.0, 580.0, 312.0, 208.0, 117.0, 69.0, 43.0, 34.0, 24.0, 17.0, 8.0, 13.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6416015625, -1.589874267578125, -1.53814697265625, -1.486419677734375, -1.4346923828125, -1.382965087890625, -1.33123779296875, -1.279510498046875, -1.227783203125, -1.176055908203125, -1.12432861328125, -1.072601318359375, -1.0208740234375, -0.969146728515625, -0.91741943359375, -0.865692138671875, -0.81396484375, -0.762237548828125, -0.71051025390625, -0.658782958984375, -0.6070556640625, -0.555328369140625, -0.50360107421875, -0.451873779296875, -0.400146484375, -0.348419189453125, -0.29669189453125, -0.244964599609375, -0.1932373046875, -0.141510009765625, -0.08978271484375, -0.038055419921875, 0.013671875, 0.065399169921875, 0.11712646484375, 0.168853759765625, 0.2205810546875, 0.272308349609375, 0.32403564453125, 0.375762939453125, 0.427490234375, 0.479217529296875, 0.53094482421875, 0.582672119140625, 0.6343994140625, 0.686126708984375, 0.73785400390625, 0.789581298828125, 0.84130859375, 0.893035888671875, 0.94476318359375, 0.996490478515625, 1.0482177734375, 1.099945068359375, 1.15167236328125, 1.203399658203125, 1.255126953125, 1.306854248046875, 1.35858154296875, 1.410308837890625, 1.4620361328125, 1.513763427734375, 1.56549072265625, 1.617218017578125, 1.6689453125]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 8.0, 9.0, 10.0, 14.0, 17.0, 30.0, 30.0, 45.0, 45.0, 50.0, 67.0, 68.0, 97.0, 74.0, 73.0, 62.0, 65.0, 55.0, 45.0, 29.0, 27.0, 22.0, 16.0, 10.0, 9.0, 5.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.732421875, -2.627960205078125, -2.52349853515625, -2.419036865234375, -2.3145751953125, -2.210113525390625, -2.10565185546875, -2.001190185546875, -1.896728515625, -1.792266845703125, -1.68780517578125, -1.583343505859375, -1.4788818359375, -1.374420166015625, -1.26995849609375, -1.165496826171875, -1.06103515625, -0.956573486328125, -0.85211181640625, -0.747650146484375, -0.6431884765625, -0.538726806640625, -0.43426513671875, -0.329803466796875, -0.225341796875, -0.120880126953125, -0.01641845703125, 0.088043212890625, 0.1925048828125, 0.296966552734375, 0.40142822265625, 0.505889892578125, 0.6103515625, 0.714813232421875, 0.81927490234375, 0.923736572265625, 1.0281982421875, 1.132659912109375, 1.23712158203125, 1.341583251953125, 1.446044921875, 1.550506591796875, 1.65496826171875, 1.759429931640625, 1.8638916015625, 1.968353271484375, 2.07281494140625, 2.177276611328125, 2.28173828125, 2.386199951171875, 2.49066162109375, 2.595123291015625, 2.6995849609375, 2.804046630859375, 2.90850830078125, 3.012969970703125, 3.117431640625, 3.221893310546875, 3.32635498046875, 3.430816650390625, 3.5352783203125, 3.639739990234375, 3.74420166015625, 3.848663330078125, 3.953125]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 9.0, 7.0, 2.0, 13.0, 12.0, 8.0, 20.0, 11.0, 12.0, 22.0, 29.0, 33.0, 33.0, 27.0, 40.0, 39.0, 54.0, 166.0, 2065.0, 972740.0, 72065.0, 689.0, 98.0, 46.0, 49.0, 45.0, 40.0, 28.0, 23.0, 14.0, 17.0, 17.0, 16.0, 17.0, 8.0, 11.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.12890625, -6.88995361328125, -6.6510009765625, -6.41204833984375, -6.173095703125, -5.93414306640625, -5.6951904296875, -5.45623779296875, -5.21728515625, -4.97833251953125, -4.7393798828125, -4.50042724609375, -4.261474609375, -4.02252197265625, -3.7835693359375, -3.54461669921875, -3.3056640625, -3.06671142578125, -2.8277587890625, -2.58880615234375, -2.349853515625, -2.11090087890625, -1.8719482421875, -1.63299560546875, -1.39404296875, -1.15509033203125, -0.9161376953125, -0.67718505859375, -0.438232421875, -0.19927978515625, 0.0396728515625, 0.27862548828125, 0.517578125, 0.75653076171875, 0.9954833984375, 1.23443603515625, 1.473388671875, 1.71234130859375, 1.9512939453125, 2.19024658203125, 2.42919921875, 2.66815185546875, 2.9071044921875, 3.14605712890625, 3.385009765625, 3.62396240234375, 3.8629150390625, 4.10186767578125, 4.3408203125, 4.57977294921875, 4.8187255859375, 5.05767822265625, 5.296630859375, 5.53558349609375, 5.7745361328125, 6.01348876953125, 6.25244140625, 6.49139404296875, 6.7303466796875, 6.96929931640625, 7.208251953125, 7.44720458984375, 7.6861572265625, 7.92510986328125, 8.1640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 9.0, 9.0, 5.0, 14.0, 14.0, 7.0, 9.0, 16.0, 20.0, 29.0, 22.0, 33.0, 26.0, 34.0, 38.0, 38.0, 45.0, 42.0, 49.0, 40.0, 50.0, 42.0, 46.0, 48.0, 38.0, 45.0, 33.0, 35.0, 27.0, 17.0, 18.0, 16.0, 11.0, 13.0, 16.0, 10.0, 14.0, 6.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.1953125, -2.121826171875, -2.04833984375, -1.974853515625, -1.9013671875, -1.827880859375, -1.75439453125, -1.680908203125, -1.607421875, -1.533935546875, -1.46044921875, -1.386962890625, -1.3134765625, -1.239990234375, -1.16650390625, -1.093017578125, -1.01953125, -0.946044921875, -0.87255859375, -0.799072265625, -0.7255859375, -0.652099609375, -0.57861328125, -0.505126953125, -0.431640625, -0.358154296875, -0.28466796875, -0.211181640625, -0.1376953125, -0.064208984375, 0.00927734375, 0.082763671875, 0.15625, 0.229736328125, 0.30322265625, 0.376708984375, 0.4501953125, 0.523681640625, 0.59716796875, 0.670654296875, 0.744140625, 0.817626953125, 0.89111328125, 0.964599609375, 1.0380859375, 1.111572265625, 1.18505859375, 1.258544921875, 1.33203125, 1.405517578125, 1.47900390625, 1.552490234375, 1.6259765625, 1.699462890625, 1.77294921875, 1.846435546875, 1.919921875, 1.993408203125, 2.06689453125, 2.140380859375, 2.2138671875, 2.287353515625, 2.36083984375, 2.434326171875, 2.5078125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 6.0, 7.0, 12.0, 20.0, 22.0, 24.0, 33.0, 47.0, 65.0, 113.0, 177.0, 289.0, 417.0, 780.0, 1492.0, 2901.0, 6250.0, 15551.0, 44991.0, 180209.0, 660021.0, 88748.0, 27079.0, 10147.0, 4459.0, 2063.0, 1056.0, 588.0, 322.0, 222.0, 132.0, 93.0, 60.0, 40.0, 32.0, 22.0, 6.0, 14.0, 6.0, 8.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.408935546875, -0.3954277038574219, -0.38191986083984375, -0.3684120178222656, -0.3549041748046875, -0.3413963317871094, -0.32788848876953125, -0.3143806457519531, -0.300872802734375, -0.2873649597167969, -0.27385711669921875, -0.2603492736816406, -0.2468414306640625, -0.23333358764648438, -0.21982574462890625, -0.20631790161132812, -0.19281005859375, -0.17930221557617188, -0.16579437255859375, -0.15228652954101562, -0.1387786865234375, -0.12527084350585938, -0.11176300048828125, -0.09825515747070312, -0.084747314453125, -0.07123947143554688, -0.05773162841796875, -0.044223785400390625, -0.0307159423828125, -0.017208099365234375, -0.00370025634765625, 0.009807586669921875, 0.0233154296875, 0.036823272705078125, 0.05033111572265625, 0.06383895874023438, 0.0773468017578125, 0.09085464477539062, 0.10436248779296875, 0.11787033081054688, 0.131378173828125, 0.14488601684570312, 0.15839385986328125, 0.17190170288085938, 0.1854095458984375, 0.19891738891601562, 0.21242523193359375, 0.22593307495117188, 0.23944091796875, 0.2529487609863281, 0.26645660400390625, 0.2799644470214844, 0.2934722900390625, 0.3069801330566406, 0.32048797607421875, 0.3339958190917969, 0.347503662109375, 0.3610115051269531, 0.37451934814453125, 0.3880271911621094, 0.4015350341796875, 0.4150428771972656, 0.42855072021484375, 0.4420585632324219, 0.45556640625]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 6.0, 7.0, 6.0, 6.0, 7.0, 9.0, 11.0, 19.0, 42.0, 29.0, 52.0, 86.0, 144.0, 180.0, 115.0, 75.0, 51.0, 32.0, 33.0, 26.0, 14.0, 12.0, 7.0, 5.0, 6.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.237361907958984e-05, -7.989630103111267e-05, -7.74189829826355e-05, -7.494166493415833e-05, -7.246434688568115e-05, -6.998702883720398e-05, -6.75097107887268e-05, -6.503239274024963e-05, -6.255507469177246e-05, -6.007775664329529e-05, -5.7600438594818115e-05, -5.512312054634094e-05, -5.264580249786377e-05, -5.01684844493866e-05, -4.7691166400909424e-05, -4.521384835243225e-05, -4.273653030395508e-05, -4.0259212255477905e-05, -3.778189420700073e-05, -3.530457615852356e-05, -3.282725811004639e-05, -3.0349940061569214e-05, -2.787262201309204e-05, -2.5395303964614868e-05, -2.2917985916137695e-05, -2.0440667867660522e-05, -1.796334981918335e-05, -1.5486031770706177e-05, -1.3008713722229004e-05, -1.0531395673751831e-05, -8.054077625274658e-06, -5.576759576797485e-06, -3.0994415283203125e-06, -6.221234798431396e-07, 1.8551945686340332e-06, 4.332512617111206e-06, 6.809830665588379e-06, 9.287148714065552e-06, 1.1764466762542725e-05, 1.4241784811019897e-05, 1.671910285949707e-05, 1.9196420907974243e-05, 2.1673738956451416e-05, 2.415105700492859e-05, 2.6628375053405762e-05, 2.9105693101882935e-05, 3.158301115036011e-05, 3.406032919883728e-05, 3.653764724731445e-05, 3.9014965295791626e-05, 4.14922833442688e-05, 4.396960139274597e-05, 4.6446919441223145e-05, 4.892423748970032e-05, 5.140155553817749e-05, 5.387887358665466e-05, 5.6356191635131836e-05, 5.883350968360901e-05, 6.131082773208618e-05, 6.378814578056335e-05, 6.626546382904053e-05, 6.87427818775177e-05, 7.122009992599487e-05, 7.369741797447205e-05, 7.617473602294922e-05]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 7.0, 12.0, 21.0, 16.0, 34.0, 77.0, 123.0, 211.0, 347.0, 751.0, 1625.0, 4387.0, 15869.0, 85932.0, 807721.0, 104901.0, 18155.0, 4883.0, 1752.0, 817.0, 382.0, 211.0, 117.0, 65.0, 47.0, 25.0, 23.0, 10.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72509765625, -0.70281982421875, -0.6805419921875, -0.65826416015625, -0.635986328125, -0.61370849609375, -0.5914306640625, -0.56915283203125, -0.546875, -0.52459716796875, -0.5023193359375, -0.48004150390625, -0.457763671875, -0.43548583984375, -0.4132080078125, -0.39093017578125, -0.36865234375, -0.34637451171875, -0.3240966796875, -0.30181884765625, -0.279541015625, -0.25726318359375, -0.2349853515625, -0.21270751953125, -0.1904296875, -0.16815185546875, -0.1458740234375, -0.12359619140625, -0.101318359375, -0.07904052734375, -0.0567626953125, -0.03448486328125, -0.01220703125, 0.01007080078125, 0.0323486328125, 0.05462646484375, 0.076904296875, 0.09918212890625, 0.1214599609375, 0.14373779296875, 0.166015625, 0.18829345703125, 0.2105712890625, 0.23284912109375, 0.255126953125, 0.27740478515625, 0.2996826171875, 0.32196044921875, 0.34423828125, 0.36651611328125, 0.3887939453125, 0.41107177734375, 0.433349609375, 0.45562744140625, 0.4779052734375, 0.50018310546875, 0.5224609375, 0.54473876953125, 0.5670166015625, 0.58929443359375, 0.611572265625, 0.63385009765625, 0.6561279296875, 0.67840576171875, 0.70068359375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 3.0, 6.0, 6.0, 13.0, 13.0, 20.0, 21.0, 27.0, 27.0, 52.0, 46.0, 147.0, 238.0, 139.0, 47.0, 39.0, 26.0, 26.0, 18.0, 11.0, 10.0, 8.0, 10.0, 3.0, 8.0, 6.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2205810546875, -0.21334266662597656, -0.20610427856445312, -0.1988658905029297, -0.19162750244140625, -0.1843891143798828, -0.17715072631835938, -0.16991233825683594, -0.1626739501953125, -0.15543556213378906, -0.14819717407226562, -0.1409587860107422, -0.13372039794921875, -0.1264820098876953, -0.11924362182617188, -0.11200523376464844, -0.104766845703125, -0.09752845764160156, -0.09029006958007812, -0.08305168151855469, -0.07581329345703125, -0.06857490539550781, -0.061336517333984375, -0.05409812927246094, -0.0468597412109375, -0.03962135314941406, -0.032382965087890625, -0.025144577026367188, -0.01790618896484375, -0.010667800903320312, -0.003429412841796875, 0.0038089752197265625, 0.01104736328125, 0.018285751342773438, 0.025524139404296875, 0.03276252746582031, 0.04000091552734375, 0.04723930358886719, 0.054477691650390625, 0.06171607971191406, 0.0689544677734375, 0.07619285583496094, 0.08343124389648438, 0.09066963195800781, 0.09790802001953125, 0.10514640808105469, 0.11238479614257812, 0.11962318420410156, 0.126861572265625, 0.13409996032714844, 0.14133834838867188, 0.1485767364501953, 0.15581512451171875, 0.1630535125732422, 0.17029190063476562, 0.17753028869628906, 0.1847686767578125, 0.19200706481933594, 0.19924545288085938, 0.2064838409423828, 0.21372222900390625, 0.2209606170654297, 0.22819900512695312, 0.23543739318847656, 0.24267578125]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 8.0, 17.0, 27.0, 59.0, 115.0, 197.0, 279.0, 158.0, 66.0, 27.0, 23.0, 11.0, 10.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.701128959655762, -4.442842960357666, -4.18455696105957, -3.9262707233428955, -3.6679847240448, -3.409698724746704, -3.1514124870300293, -2.8931264877319336, -2.634840488433838, -2.376554489135742, -2.1182684898376465, -1.8599822521209717, -1.601696252822876, -1.3434102535247803, -1.085124135017395, -0.8268380165100098, -0.5685520172119141, -0.3102659583091736, -0.051979899406433105, 0.20630615949630737, 0.46459221839904785, 0.7228782176971436, 0.9811643362045288, 1.239450454711914, 1.4977364540100098, 1.7560224533081055, 2.014308452606201, 2.272594690322876, 2.5308806896209717, 2.7891666889190674, 3.047452926635742, 3.305738925933838, 3.5640249252319336, 3.8223109245300293, 4.080596923828125, 4.338882923126221, 4.597168922424316, 4.85545539855957, 5.113741397857666, 5.372027397155762, 5.630313396453857, 5.888599395751953, 6.146885395050049, 6.4051713943481445, 6.663457870483398, 6.921743392944336, 7.18002986907959, 7.4383158683776855, 7.696601867675781, 7.954887866973877, 8.213173866271973, 8.471460342407227, 8.729745864868164, 8.988032341003418, 9.246317863464355, 9.50460433959961, 9.762889862060547, 10.0211763381958, 10.279461860656738, 10.537748336791992, 10.79603385925293, 11.054320335388184, 11.312605857849121, 11.570892333984375, 11.829178810119629]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 9.0, 4.0, 10.0, 9.0, 8.0, 11.0, 20.0, 17.0, 24.0, 40.0, 26.0, 39.0, 39.0, 52.0, 55.0, 48.0, 62.0, 65.0, 59.0, 53.0, 37.0, 48.0, 50.0, 44.0, 36.0, 18.0, 22.0, 20.0, 15.0, 22.0, 10.0, 8.0, 6.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5405592918396, -4.394334316253662, -4.248109340667725, -4.101884365081787, -3.9556591510772705, -3.809434175491333, -3.6632089614868164, -3.516983985900879, -3.3707590103149414, -3.224534034729004, -3.0783090591430664, -2.93208384513855, -2.7858588695526123, -2.639633893966675, -2.493408679962158, -2.3471837043762207, -2.200958728790283, -2.0547337532043457, -1.9085086584091187, -1.7622835636138916, -1.616058588027954, -1.4698336124420166, -1.3236085176467896, -1.1773834228515625, -1.031158447265625, -0.8849334120750427, -0.7387083768844604, -0.5924833416938782, -0.4462583065032959, -0.3000332713127136, -0.15380823612213135, -0.007583141326904297, 0.1386418342590332, 0.2848668694496155, 0.43109190464019775, 0.57731693983078, 0.7235419750213623, 0.8697670102119446, 1.0159920454025269, 1.162217140197754, 1.3084421157836914, 1.454667091369629, 1.600892186164856, 1.747117280960083, 1.8933422565460205, 2.039567232131958, 2.1857924461364746, 2.332017421722412, 2.4782423973083496, 2.624467372894287, 2.7706923484802246, 2.916917562484741, 3.0631425380706787, 3.209367513656616, 3.355592727661133, 3.5018177032470703, 3.648042678833008, 3.7942676544189453, 3.940492630004883, 4.08671760559082, 4.232942581176758, 4.3791680335998535, 4.525393009185791, 4.6716179847717285, 4.817842960357666]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 7.0, 4.0, 10.0, 17.0, 15.0, 20.0, 42.0, 54.0, 89.0, 116.0, 197.0, 349.0, 670.0, 1338.0, 2986.0, 7743.0, 24695.0, 114171.0, 1227746.0, 2580844.0, 179862.0, 35527.0, 10518.0, 3790.0, 1661.0, 786.0, 398.0, 239.0, 126.0, 80.0, 63.0, 38.0, 28.0, 20.0, 11.0, 6.0, 8.0, 5.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.171875, -2.099761962890625, -2.02764892578125, -1.955535888671875, -1.8834228515625, -1.811309814453125, -1.73919677734375, -1.667083740234375, -1.594970703125, -1.522857666015625, -1.45074462890625, -1.378631591796875, -1.3065185546875, -1.234405517578125, -1.16229248046875, -1.090179443359375, -1.01806640625, -0.945953369140625, -0.87384033203125, -0.801727294921875, -0.7296142578125, -0.657501220703125, -0.58538818359375, -0.513275146484375, -0.441162109375, -0.369049072265625, -0.29693603515625, -0.224822998046875, -0.1527099609375, -0.080596923828125, -0.00848388671875, 0.063629150390625, 0.1357421875, 0.207855224609375, 0.27996826171875, 0.352081298828125, 0.4241943359375, 0.496307373046875, 0.56842041015625, 0.640533447265625, 0.712646484375, 0.784759521484375, 0.85687255859375, 0.928985595703125, 1.0010986328125, 1.073211669921875, 1.14532470703125, 1.217437744140625, 1.28955078125, 1.361663818359375, 1.43377685546875, 1.505889892578125, 1.5780029296875, 1.650115966796875, 1.72222900390625, 1.794342041015625, 1.866455078125, 1.938568115234375, 2.01068115234375, 2.082794189453125, 2.1549072265625, 2.227020263671875, 2.29913330078125, 2.371246337890625, 2.443359375]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 7.0, 6.0, 6.0, 11.0, 18.0, 13.0, 13.0, 24.0, 28.0, 30.0, 63.0, 56.0, 74.0, 73.0, 90.0, 86.0, 61.0, 75.0, 55.0, 48.0, 36.0, 32.0, 28.0, 23.0, 9.0, 10.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9609375, -1.902740478515625, -1.84454345703125, -1.786346435546875, -1.7281494140625, -1.669952392578125, -1.61175537109375, -1.553558349609375, -1.495361328125, -1.437164306640625, -1.37896728515625, -1.320770263671875, -1.2625732421875, -1.204376220703125, -1.14617919921875, -1.087982177734375, -1.02978515625, -0.971588134765625, -0.91339111328125, -0.855194091796875, -0.7969970703125, -0.738800048828125, -0.68060302734375, -0.622406005859375, -0.564208984375, -0.506011962890625, -0.44781494140625, -0.389617919921875, -0.3314208984375, -0.273223876953125, -0.21502685546875, -0.156829833984375, -0.0986328125, -0.040435791015625, 0.01776123046875, 0.075958251953125, 0.1341552734375, 0.192352294921875, 0.25054931640625, 0.308746337890625, 0.366943359375, 0.425140380859375, 0.48333740234375, 0.541534423828125, 0.5997314453125, 0.657928466796875, 0.71612548828125, 0.774322509765625, 0.83251953125, 0.890716552734375, 0.94891357421875, 1.007110595703125, 1.0653076171875, 1.123504638671875, 1.18170166015625, 1.239898681640625, 1.298095703125, 1.356292724609375, 1.41448974609375, 1.472686767578125, 1.5308837890625, 1.589080810546875, 1.64727783203125, 1.705474853515625, 1.763671875]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 10.0, 14.0, 30.0, 43.0, 78.0, 153.0, 373.0, 1494.0, 14406.0, 3061049.0, 1103870.0, 10856.0, 1247.0, 338.0, 149.0, 84.0, 26.0, 25.0, 14.0, 6.0, 6.0, 6.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.05078125, -4.85614013671875, -4.6614990234375, -4.46685791015625, -4.272216796875, -4.07757568359375, -3.8829345703125, -3.68829345703125, -3.49365234375, -3.29901123046875, -3.1043701171875, -2.90972900390625, -2.715087890625, -2.52044677734375, -2.3258056640625, -2.13116455078125, -1.9365234375, -1.74188232421875, -1.5472412109375, -1.35260009765625, -1.157958984375, -0.96331787109375, -0.7686767578125, -0.57403564453125, -0.37939453125, -0.18475341796875, 0.0098876953125, 0.20452880859375, 0.399169921875, 0.59381103515625, 0.7884521484375, 0.98309326171875, 1.177734375, 1.37237548828125, 1.5670166015625, 1.76165771484375, 1.956298828125, 2.15093994140625, 2.3455810546875, 2.54022216796875, 2.73486328125, 2.92950439453125, 3.1241455078125, 3.31878662109375, 3.513427734375, 3.70806884765625, 3.9027099609375, 4.09735107421875, 4.2919921875, 4.48663330078125, 4.6812744140625, 4.87591552734375, 5.070556640625, 5.26519775390625, 5.4598388671875, 5.65447998046875, 5.84912109375, 6.04376220703125, 6.2384033203125, 6.43304443359375, 6.627685546875, 6.82232666015625, 7.0169677734375, 7.21160888671875, 7.40625]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 10.0, 7.0, 6.0, 18.0, 18.0, 25.0, 36.0, 63.0, 60.0, 104.0, 164.0, 242.0, 363.0, 626.0, 944.0, 486.0, 295.0, 185.0, 111.0, 87.0, 64.0, 44.0, 40.0, 28.0, 21.0, 14.0, 4.0, 2.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.460205078125, -0.4404487609863281, -0.42069244384765625, -0.4009361267089844, -0.3811798095703125, -0.3614234924316406, -0.34166717529296875, -0.3219108581542969, -0.302154541015625, -0.2823982238769531, -0.26264190673828125, -0.24288558959960938, -0.2231292724609375, -0.20337295532226562, -0.18361663818359375, -0.16386032104492188, -0.14410400390625, -0.12434768676757812, -0.10459136962890625, -0.08483505249023438, -0.0650787353515625, -0.045322418212890625, -0.02556610107421875, -0.005809783935546875, 0.013946533203125, 0.033702850341796875, 0.05345916748046875, 0.07321548461914062, 0.0929718017578125, 0.11272811889648438, 0.13248443603515625, 0.15224075317382812, 0.1719970703125, 0.19175338745117188, 0.21150970458984375, 0.23126602172851562, 0.2510223388671875, 0.2707786560058594, 0.29053497314453125, 0.3102912902832031, 0.330047607421875, 0.3498039245605469, 0.36956024169921875, 0.3893165588378906, 0.4090728759765625, 0.4288291931152344, 0.44858551025390625, 0.4683418273925781, 0.48809814453125, 0.5078544616699219, 0.5276107788085938, 0.5473670959472656, 0.5671234130859375, 0.5868797302246094, 0.6066360473632812, 0.6263923645019531, 0.646148681640625, 0.6659049987792969, 0.6856613159179688, 0.7054176330566406, 0.7251739501953125, 0.7449302673339844, 0.7646865844726562, 0.7844429016113281, 0.80419921875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 8.0, 1.0, 7.0, 9.0, 13.0, 30.0, 58.0, 107.0, 155.0, 191.0, 179.0, 111.0, 47.0, 24.0, 19.0, 13.0, 11.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.780796527862549, -4.643094062805176, -4.505391597747803, -4.36768913269043, -4.229987144470215, -4.092284679412842, -3.9545822143554688, -3.8168797492980957, -3.6791772842407227, -3.5414748191833496, -3.4037725925445557, -3.2660701274871826, -3.1283676624298096, -2.9906654357910156, -2.8529629707336426, -2.7152605056762695, -2.5775582790374756, -2.4398558139801025, -2.3021535873413086, -2.1644511222839355, -2.0267486572265625, -1.889046311378479, -1.7513439655303955, -1.6136415004730225, -1.475939154624939, -1.3382368087768555, -1.2005343437194824, -1.062831997871399, -0.9251295924186707, -0.7874271869659424, -0.6497248411178589, -0.5120224356651306, -0.37432003021240234, -0.23661763966083527, -0.09891524910926819, 0.038787126541137695, 0.17648953199386597, 0.31419193744659424, 0.45189428329467773, 0.589596688747406, 0.7272990942001343, 0.8650014996528625, 1.0027039051055908, 1.1404062509536743, 1.2781085968017578, 1.4158110618591309, 1.5535134077072144, 1.6912157535552979, 1.828918218612671, 1.9666205644607544, 2.104322910308838, 2.242025375366211, 2.379727840423584, 2.517430305480957, 2.655132532119751, 2.792834997177124, 2.930537223815918, 3.068239688873291, 3.205941915512085, 3.343644380569458, 3.481346845626831, 3.619049072265625, 3.756751537322998, 3.894454002380371, 4.032156467437744]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 8.0, 8.0, 11.0, 16.0, 16.0, 20.0, 23.0, 17.0, 28.0, 43.0, 45.0, 46.0, 50.0, 50.0, 66.0, 65.0, 73.0, 70.0, 49.0, 55.0, 52.0, 37.0, 47.0, 20.0, 21.0, 12.0, 12.0, 7.0, 9.0, 3.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9663660526275635, -1.9075082540512085, -1.848650336265564, -1.789792537689209, -1.730934739112854, -1.6720768213272095, -1.6132190227508545, -1.55436110496521, -1.495503306388855, -1.4366455078125, -1.3777875900268555, -1.3189297914505005, -1.2600719928741455, -1.201214075088501, -1.142356276512146, -1.083498477935791, -1.0246405601501465, -0.9657827019691467, -0.9069249033927917, -0.848067045211792, -0.7892091870307922, -0.7303513288497925, -0.6714935302734375, -0.6126356720924377, -0.5537779331207275, -0.49492010474205017, -0.4360622465610504, -0.37720441818237305, -0.3183465600013733, -0.2594887316226959, -0.20063090324401855, -0.1417730450630188, -0.08291518688201904, -0.02405734732747078, 0.034800492227077484, 0.09365832805633545, 0.152516171336174, 0.21137401461601257, 0.27023184299468994, 0.3290897011756897, 0.38794752955436707, 0.44680535793304443, 0.5056632161140442, 0.564521074295044, 0.6233788728713989, 0.6822367310523987, 0.7410945892333984, 0.7999523878097534, 0.8588102459907532, 0.9176681041717529, 0.9765259027481079, 1.035383701324463, 1.0942416191101074, 1.1530994176864624, 1.2119572162628174, 1.270815134048462, 1.329672932624817, 1.3885307312011719, 1.4473886489868164, 1.5062464475631714, 1.5651042461395264, 1.623962163925171, 1.6828199625015259, 1.7416777610778809, 1.8005356788635254]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 6.0, 13.0, 14.0, 22.0, 34.0, 37.0, 84.0, 147.0, 306.0, 772.0, 2808.0, 26799.0, 950095.0, 61717.0, 4010.0, 929.0, 353.0, 162.0, 93.0, 63.0, 29.0, 20.0, 6.0, 12.0, 10.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45166015625, -0.43468475341796875, -0.4177093505859375, -0.40073394775390625, -0.383758544921875, -0.36678314208984375, -0.3498077392578125, -0.33283233642578125, -0.31585693359375, -0.29888153076171875, -0.2819061279296875, -0.26493072509765625, -0.247955322265625, -0.23097991943359375, -0.2140045166015625, -0.19702911376953125, -0.1800537109375, -0.16307830810546875, -0.1461029052734375, -0.12912750244140625, -0.112152099609375, -0.09517669677734375, -0.0782012939453125, -0.06122589111328125, -0.04425048828125, -0.02727508544921875, -0.0102996826171875, 0.00667572021484375, 0.023651123046875, 0.04062652587890625, 0.0576019287109375, 0.07457733154296875, 0.091552734375, 0.10852813720703125, 0.1255035400390625, 0.14247894287109375, 0.159454345703125, 0.17642974853515625, 0.1934051513671875, 0.21038055419921875, 0.22735595703125, 0.24433135986328125, 0.2613067626953125, 0.27828216552734375, 0.295257568359375, 0.31223297119140625, 0.3292083740234375, 0.34618377685546875, 0.3631591796875, 0.38013458251953125, 0.3971099853515625, 0.41408538818359375, 0.431060791015625, 0.44803619384765625, 0.4650115966796875, 0.48198699951171875, 0.49896240234375, 0.5159378051757812, 0.5329132080078125, 0.5498886108398438, 0.566864013671875, 0.5838394165039062, 0.6008148193359375, 0.6177902221679688, 0.634765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 10.0, 7.0, 22.0, 25.0, 31.0, 40.0, 61.0, 67.0, 68.0, 94.0, 97.0, 85.0, 108.0, 79.0, 69.0, 35.0, 31.0, 23.0, 12.0, 8.0, 4.0, 2.0, 9.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4453125, -1.388641357421875, -1.33197021484375, -1.275299072265625, -1.2186279296875, -1.161956787109375, -1.10528564453125, -1.048614501953125, -0.991943359375, -0.935272216796875, -0.87860107421875, -0.821929931640625, -0.7652587890625, -0.708587646484375, -0.65191650390625, -0.595245361328125, -0.53857421875, -0.481903076171875, -0.42523193359375, -0.368560791015625, -0.3118896484375, -0.255218505859375, -0.19854736328125, -0.141876220703125, -0.085205078125, -0.028533935546875, 0.02813720703125, 0.084808349609375, 0.1414794921875, 0.198150634765625, 0.25482177734375, 0.311492919921875, 0.3681640625, 0.424835205078125, 0.48150634765625, 0.538177490234375, 0.5948486328125, 0.651519775390625, 0.70819091796875, 0.764862060546875, 0.821533203125, 0.878204345703125, 0.93487548828125, 0.991546630859375, 1.0482177734375, 1.104888916015625, 1.16156005859375, 1.218231201171875, 1.27490234375, 1.331573486328125, 1.38824462890625, 1.444915771484375, 1.5015869140625, 1.558258056640625, 1.61492919921875, 1.671600341796875, 1.728271484375, 1.784942626953125, 1.84161376953125, 1.898284912109375, 1.9549560546875, 2.011627197265625, 2.06829833984375, 2.124969482421875, 2.181640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 5.0, 11.0, 5.0, 11.0, 13.0, 23.0, 20.0, 35.0, 40.0, 52.0, 74.0, 96.0, 127.0, 193.0, 269.0, 460.0, 1162.0, 5670.0, 46211.0, 597988.0, 363835.0, 26731.0, 3394.0, 824.0, 442.0, 249.0, 152.0, 117.0, 85.0, 70.0, 57.0, 29.0, 23.0, 24.0, 11.0, 16.0, 6.0, 3.0, 5.0, 4.0, 5.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.191162109375, -0.18552207946777344, -0.17988204956054688, -0.1742420196533203, -0.16860198974609375, -0.1629619598388672, -0.15732192993164062, -0.15168190002441406, -0.1460418701171875, -0.14040184020996094, -0.13476181030273438, -0.1291217803955078, -0.12348175048828125, -0.11784172058105469, -0.11220169067382812, -0.10656166076660156, -0.100921630859375, -0.09528160095214844, -0.08964157104492188, -0.08400154113769531, -0.07836151123046875, -0.07272148132324219, -0.06708145141601562, -0.06144142150878906, -0.0558013916015625, -0.05016136169433594, -0.044521331787109375, -0.03888130187988281, -0.03324127197265625, -0.027601242065429688, -0.021961212158203125, -0.016321182250976562, -0.01068115234375, -0.0050411224365234375, 0.000598907470703125, 0.0062389373779296875, 0.01187896728515625, 0.017518997192382812, 0.023159027099609375, 0.028799057006835938, 0.0344390869140625, 0.04007911682128906, 0.045719146728515625, 0.05135917663574219, 0.05699920654296875, 0.06263923645019531, 0.06827926635742188, 0.07391929626464844, 0.079559326171875, 0.08519935607910156, 0.09083938598632812, 0.09647941589355469, 0.10211944580078125, 0.10775947570800781, 0.11339950561523438, 0.11903953552246094, 0.1246795654296875, 0.13031959533691406, 0.13595962524414062, 0.1415996551513672, 0.14723968505859375, 0.1528797149658203, 0.15851974487304688, 0.16415977478027344, 0.1697998046875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 9.0, 10.0, 7.0, 18.0, 17.0, 13.0, 18.0, 22.0, 24.0, 19.0, 29.0, 26.0, 38.0, 34.0, 42.0, 44.0, 46.0, 56.0, 55.0, 58.0, 35.0, 41.0, 45.0, 31.0, 34.0, 40.0, 31.0, 27.0, 16.0, 19.0, 14.0, 15.0, 12.0, 13.0, 10.0, 6.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.962890625, -1.909149169921875, -1.85540771484375, -1.801666259765625, -1.7479248046875, -1.694183349609375, -1.64044189453125, -1.586700439453125, -1.532958984375, -1.479217529296875, -1.42547607421875, -1.371734619140625, -1.3179931640625, -1.264251708984375, -1.21051025390625, -1.156768798828125, -1.10302734375, -1.049285888671875, -0.99554443359375, -0.941802978515625, -0.8880615234375, -0.834320068359375, -0.78057861328125, -0.726837158203125, -0.673095703125, -0.619354248046875, -0.56561279296875, -0.511871337890625, -0.4581298828125, -0.404388427734375, -0.35064697265625, -0.296905517578125, -0.2431640625, -0.189422607421875, -0.13568115234375, -0.081939697265625, -0.0281982421875, 0.025543212890625, 0.07928466796875, 0.133026123046875, 0.186767578125, 0.240509033203125, 0.29425048828125, 0.347991943359375, 0.4017333984375, 0.455474853515625, 0.50921630859375, 0.562957763671875, 0.61669921875, 0.670440673828125, 0.72418212890625, 0.777923583984375, 0.8316650390625, 0.885406494140625, 0.93914794921875, 0.992889404296875, 1.046630859375, 1.100372314453125, 1.15411376953125, 1.207855224609375, 1.2615966796875, 1.315338134765625, 1.36907958984375, 1.422821044921875, 1.4765625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 6.0, 9.0, 8.0, 8.0, 9.0, 15.0, 10.0, 20.0, 26.0, 21.0, 39.0, 41.0, 53.0, 77.0, 113.0, 192.0, 303.0, 518.0, 1234.0, 3829.0, 19226.0, 562803.0, 436929.0, 16821.0, 3601.0, 1147.0, 545.0, 299.0, 190.0, 126.0, 89.0, 42.0, 35.0, 25.0, 25.0, 18.0, 20.0, 14.0, 17.0, 14.0, 10.0, 7.0, 7.0, 4.0, 6.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030059814453125, -0.029022216796875, -0.027984619140625, -0.026947021484375, -0.025909423828125, -0.024871826171875, -0.023834228515625, -0.022796630859375, -0.021759033203125, -0.020721435546875, -0.019683837890625, -0.018646240234375, -0.017608642578125, -0.016571044921875, -0.015533447265625, -0.014495849609375, -0.013458251953125, -0.012420654296875, -0.011383056640625, -0.010345458984375, -0.009307861328125, -0.008270263671875, -0.007232666015625, -0.006195068359375, -0.005157470703125, -0.004119873046875, -0.003082275390625, -0.002044677734375, -0.001007080078125, 3.0517578125e-05, 0.001068115234375, 0.002105712890625, 0.003143310546875, 0.004180908203125, 0.005218505859375, 0.006256103515625, 0.007293701171875, 0.008331298828125, 0.009368896484375, 0.010406494140625, 0.011444091796875, 0.012481689453125, 0.013519287109375, 0.014556884765625, 0.015594482421875, 0.016632080078125, 0.017669677734375, 0.018707275390625, 0.019744873046875, 0.020782470703125, 0.021820068359375, 0.022857666015625, 0.023895263671875, 0.024932861328125, 0.025970458984375, 0.027008056640625, 0.028045654296875, 0.029083251953125, 0.030120849609375, 0.031158447265625, 0.032196044921875, 0.033233642578125, 0.034271240234375, 0.035308837890625, 0.036346435546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 6.0, 10.0, 19.0, 13.0, 28.0, 49.0, 64.0, 73.0, 84.0, 97.0, 111.0, 95.0, 102.0, 68.0, 49.0, 46.0, 29.0, 13.0, 14.0, 9.0, 8.0, 3.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8656253814697266e-05, -1.814216375350952e-05, -1.7628073692321777e-05, -1.7113983631134033e-05, -1.659989356994629e-05, -1.6085803508758545e-05, -1.55717134475708e-05, -1.5057623386383057e-05, -1.4543533325195312e-05, -1.4029443264007568e-05, -1.3515353202819824e-05, -1.300126314163208e-05, -1.2487173080444336e-05, -1.1973083019256592e-05, -1.1458992958068848e-05, -1.0944902896881104e-05, -1.043081283569336e-05, -9.916722774505615e-06, -9.402632713317871e-06, -8.888542652130127e-06, -8.374452590942383e-06, -7.860362529754639e-06, -7.3462724685668945e-06, -6.83218240737915e-06, -6.318092346191406e-06, -5.804002285003662e-06, -5.289912223815918e-06, -4.775822162628174e-06, -4.26173210144043e-06, -3.7476420402526855e-06, -3.2335519790649414e-06, -2.7194619178771973e-06, -2.205371856689453e-06, -1.691281795501709e-06, -1.1771917343139648e-06, -6.631016731262207e-07, -1.4901161193847656e-07, 3.650784492492676e-07, 8.791685104370117e-07, 1.3932585716247559e-06, 1.9073486328125e-06, 2.421438694000244e-06, 2.9355287551879883e-06, 3.4496188163757324e-06, 3.9637088775634766e-06, 4.477798938751221e-06, 4.991888999938965e-06, 5.505979061126709e-06, 6.020069122314453e-06, 6.534159183502197e-06, 7.048249244689941e-06, 7.5623393058776855e-06, 8.07642936706543e-06, 8.590519428253174e-06, 9.104609489440918e-06, 9.618699550628662e-06, 1.0132789611816406e-05, 1.064687967300415e-05, 1.1160969734191895e-05, 1.1675059795379639e-05, 1.2189149856567383e-05, 1.2703239917755127e-05, 1.3217329978942871e-05, 1.3731420040130615e-05, 1.424551010131836e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 11.0, 7.0, 8.0, 33.0, 30.0, 50.0, 80.0, 123.0, 191.0, 340.0, 617.0, 1099.0, 2134.0, 4577.0, 10771.0, 33495.0, 171331.0, 682706.0, 101001.0, 23859.0, 8523.0, 3696.0, 1701.0, 875.0, 484.0, 279.0, 190.0, 111.0, 65.0, 59.0, 27.0, 22.0, 20.0, 14.0, 9.0, 6.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0268402099609375, -0.026035785675048828, -0.025231361389160156, -0.024426937103271484, -0.023622512817382812, -0.02281808853149414, -0.02201366424560547, -0.021209239959716797, -0.020404815673828125, -0.019600391387939453, -0.01879596710205078, -0.01799154281616211, -0.017187118530273438, -0.016382694244384766, -0.015578269958496094, -0.014773845672607422, -0.01396942138671875, -0.013164997100830078, -0.012360572814941406, -0.011556148529052734, -0.010751724243164062, -0.00994729995727539, -0.009142875671386719, -0.008338451385498047, -0.007534027099609375, -0.006729602813720703, -0.005925178527832031, -0.005120754241943359, -0.0043163299560546875, -0.0035119056701660156, -0.0027074813842773438, -0.0019030570983886719, -0.0010986328125, -0.0002942085266113281, 0.0005102157592773438, 0.0013146400451660156, 0.0021190643310546875, 0.0029234886169433594, 0.0037279129028320312, 0.004532337188720703, 0.005336761474609375, 0.006141185760498047, 0.006945610046386719, 0.007750034332275391, 0.008554458618164062, 0.009358882904052734, 0.010163307189941406, 0.010967731475830078, 0.01177215576171875, 0.012576580047607422, 0.013381004333496094, 0.014185428619384766, 0.014989852905273438, 0.01579427719116211, 0.01659870147705078, 0.017403125762939453, 0.018207550048828125, 0.019011974334716797, 0.01981639862060547, 0.02062082290649414, 0.021425247192382812, 0.022229671478271484, 0.023034095764160156, 0.023838520050048828, 0.0246429443359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 6.0, 3.0, 7.0, 8.0, 11.0, 15.0, 13.0, 16.0, 24.0, 50.0, 63.0, 97.0, 135.0, 176.0, 124.0, 89.0, 49.0, 24.0, 23.0, 14.0, 9.0, 14.0, 4.0, 4.0, 4.0, 5.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.00612640380859375, -0.005957841873168945, -0.005789279937744141, -0.005620718002319336, -0.005452156066894531, -0.0052835941314697266, -0.005115032196044922, -0.004946470260620117, -0.0047779083251953125, -0.004609346389770508, -0.004440784454345703, -0.0042722225189208984, -0.004103660583496094, -0.003935098648071289, -0.0037665367126464844, -0.0035979747772216797, -0.003429412841796875, -0.0032608509063720703, -0.0030922889709472656, -0.002923727035522461, -0.0027551651000976562, -0.0025866031646728516, -0.002418041229248047, -0.002249479293823242, -0.0020809173583984375, -0.0019123554229736328, -0.0017437934875488281, -0.0015752315521240234, -0.0014066696166992188, -0.001238107681274414, -0.0010695457458496094, -0.0009009838104248047, -0.000732421875, -0.0005638599395751953, -0.0003952980041503906, -0.00022673606872558594, -5.817413330078125e-05, 0.00011038780212402344, 0.0002789497375488281, 0.0004475116729736328, 0.0006160736083984375, 0.0007846355438232422, 0.0009531974792480469, 0.0011217594146728516, 0.0012903213500976562, 0.001458883285522461, 0.0016274452209472656, 0.0017960071563720703, 0.001964569091796875, 0.0021331310272216797, 0.0023016929626464844, 0.002470254898071289, 0.0026388168334960938, 0.0028073787689208984, 0.002975940704345703, 0.003144502639770508, 0.0033130645751953125, 0.003481626510620117, 0.003650188446044922, 0.0038187503814697266, 0.003987312316894531, 0.004155874252319336, 0.004324436187744141, 0.004492998123168945, 0.00466156005859375]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 4.0, 5.0, 9.0, 25.0, 45.0, 79.0, 164.0, 229.0, 204.0, 105.0, 50.0, 22.0, 13.0, 13.0, 10.0, 8.0, 7.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.93825101852417, -2.839751720428467, -2.7412524223327637, -2.6427531242370605, -2.5442538261413574, -2.4457545280456543, -2.347255229949951, -2.248755931854248, -2.150256633758545, -2.051757335662842, -1.9532580375671387, -1.8547587394714355, -1.7562594413757324, -1.6577601432800293, -1.5592607259750366, -1.4607614278793335, -1.3622620105743408, -1.2637627124786377, -1.1652634143829346, -1.0667641162872314, -0.9682647585868835, -0.8697654604911804, -0.7712661027908325, -0.6727668046951294, -0.5742675065994263, -0.47576820850372314, -0.37726888060569763, -0.2787695527076721, -0.180270254611969, -0.08177095651626587, 0.01672840118408203, 0.11522769927978516, 0.21372723579406738, 0.3122265338897705, 0.410725861787796, 0.5092251896858215, 0.6077244877815247, 0.7062237858772278, 0.8047231435775757, 0.9032224416732788, 1.001721739768982, 1.100221037864685, 1.1987203359603882, 1.2972197532653809, 1.395719051361084, 1.494218349456787, 1.5927176475524902, 1.6912169456481934, 1.7897162437438965, 1.8882155418395996, 1.9867148399353027, 2.085214138031006, 2.183713436126709, 2.282212734222412, 2.3807120323181152, 2.4792113304138184, 2.5777106285095215, 2.6762099266052246, 2.7747092247009277, 2.873208522796631, 2.971707820892334, 3.070207118988037, 3.1687064170837402, 3.2672057151794434, 3.3657052516937256]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 7.0, 2.0, 12.0, 13.0, 12.0, 19.0, 21.0, 24.0, 28.0, 54.0, 58.0, 53.0, 69.0, 80.0, 92.0, 94.0, 74.0, 75.0, 51.0, 48.0, 36.0, 19.0, 14.0, 10.0, 12.0, 7.0, 2.0, 4.0, 7.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4401131868362427, -1.3941035270690918, -1.3480939865112305, -1.3020843267440796, -1.2560747861862183, -1.2100651264190674, -1.164055585861206, -1.1180459260940552, -1.0720362663269043, -1.0260266065597534, -0.9800170660018921, -0.9340074062347412, -0.8879978656768799, -0.841988205909729, -0.7959786057472229, -0.7499690055847168, -0.7039594650268555, -0.6579498648643494, -0.6119402647018433, -0.5659306049346924, -0.519921064376831, -0.47391143441200256, -0.4279018044471741, -0.38189220428466797, -0.33588260412216187, -0.28987300395965576, -0.24386338889598846, -0.19785377383232117, -0.15184417366981506, -0.10583457350730896, -0.05982494354248047, -0.013815343379974365, 0.03219437599182129, 0.07820398360490799, 0.12421359121799469, 0.170223206281662, 0.2162328064441681, 0.2622424066066742, 0.3082520365715027, 0.3542616367340088, 0.4002712368965149, 0.446280837059021, 0.4922904372215271, 0.5383000373840332, 0.5843096971511841, 0.6303192377090454, 0.6763288974761963, 0.7223384976387024, 0.7683480978012085, 0.8143576979637146, 0.8603672981262207, 0.9063769578933716, 0.9523864984512329, 0.9983961582183838, 1.0444056987762451, 1.090415358543396, 1.1364250183105469, 1.1824346780776978, 1.228444218635559, 1.27445387840271, 1.3204634189605713, 1.3664730787277222, 1.412482738494873, 1.4584922790527344, 1.5045018196105957]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 10.0, 8.0, 12.0, 17.0, 30.0, 73.0, 135.0, 212.0, 342.0, 744.0, 1424.0, 3083.0, 7779.0, 24320.0, 113275.0, 606281.0, 230784.0, 40395.0, 11503.0, 4286.0, 1842.0, 930.0, 459.0, 273.0, 131.0, 83.0, 47.0, 27.0, 16.0, 10.0, 6.0, 4.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.00390625, -1.9385986328125, -1.873291015625, -1.8079833984375, -1.74267578125, -1.6773681640625, -1.612060546875, -1.5467529296875, -1.4814453125, -1.4161376953125, -1.350830078125, -1.2855224609375, -1.22021484375, -1.1549072265625, -1.089599609375, -1.0242919921875, -0.958984375, -0.8936767578125, -0.828369140625, -0.7630615234375, -0.69775390625, -0.6324462890625, -0.567138671875, -0.5018310546875, -0.4365234375, -0.3712158203125, -0.305908203125, -0.2406005859375, -0.17529296875, -0.1099853515625, -0.044677734375, 0.0206298828125, 0.0859375, 0.1512451171875, 0.216552734375, 0.2818603515625, 0.34716796875, 0.4124755859375, 0.477783203125, 0.5430908203125, 0.6083984375, 0.6737060546875, 0.739013671875, 0.8043212890625, 0.86962890625, 0.9349365234375, 1.000244140625, 1.0655517578125, 1.130859375, 1.1961669921875, 1.261474609375, 1.3267822265625, 1.39208984375, 1.4573974609375, 1.522705078125, 1.5880126953125, 1.6533203125, 1.7186279296875, 1.783935546875, 1.8492431640625, 1.91455078125, 1.9798583984375, 2.045166015625, 2.1104736328125, 2.17578125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 9.0, 8.0, 9.0, 19.0, 8.0, 24.0, 29.0, 31.0, 47.0, 57.0, 53.0, 58.0, 84.0, 94.0, 71.0, 82.0, 60.0, 52.0, 52.0, 28.0, 24.0, 19.0, 26.0, 11.0, 10.0, 4.0, 7.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.763671875, -2.676025390625, -2.58837890625, -2.500732421875, -2.4130859375, -2.325439453125, -2.23779296875, -2.150146484375, -2.0625, -1.974853515625, -1.88720703125, -1.799560546875, -1.7119140625, -1.624267578125, -1.53662109375, -1.448974609375, -1.361328125, -1.273681640625, -1.18603515625, -1.098388671875, -1.0107421875, -0.923095703125, -0.83544921875, -0.747802734375, -0.66015625, -0.572509765625, -0.48486328125, -0.397216796875, -0.3095703125, -0.221923828125, -0.13427734375, -0.046630859375, 0.041015625, 0.128662109375, 0.21630859375, 0.303955078125, 0.3916015625, 0.479248046875, 0.56689453125, 0.654541015625, 0.7421875, 0.829833984375, 0.91748046875, 1.005126953125, 1.0927734375, 1.180419921875, 1.26806640625, 1.355712890625, 1.443359375, 1.531005859375, 1.61865234375, 1.706298828125, 1.7939453125, 1.881591796875, 1.96923828125, 2.056884765625, 2.14453125, 2.232177734375, 2.31982421875, 2.407470703125, 2.4951171875, 2.582763671875, 2.67041015625, 2.758056640625, 2.845703125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 3.0, 6.0, 10.0, 4.0, 5.0, 8.0, 11.0, 15.0, 13.0, 20.0, 22.0, 27.0, 31.0, 26.0, 35.0, 41.0, 73.0, 110.0, 379.0, 1660.0, 21708.0, 963645.0, 56909.0, 2740.0, 477.0, 148.0, 77.0, 48.0, 45.0, 30.0, 37.0, 22.0, 21.0, 18.0, 18.0, 19.0, 12.0, 10.0, 8.0, 14.0, 7.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.578125, -5.39593505859375, -5.2137451171875, -5.03155517578125, -4.849365234375, -4.66717529296875, -4.4849853515625, -4.30279541015625, -4.12060546875, -3.93841552734375, -3.7562255859375, -3.57403564453125, -3.391845703125, -3.20965576171875, -3.0274658203125, -2.84527587890625, -2.6630859375, -2.48089599609375, -2.2987060546875, -2.11651611328125, -1.934326171875, -1.75213623046875, -1.5699462890625, -1.38775634765625, -1.20556640625, -1.02337646484375, -0.8411865234375, -0.65899658203125, -0.476806640625, -0.29461669921875, -0.1124267578125, 0.06976318359375, 0.251953125, 0.43414306640625, 0.6163330078125, 0.79852294921875, 0.980712890625, 1.16290283203125, 1.3450927734375, 1.52728271484375, 1.70947265625, 1.89166259765625, 2.0738525390625, 2.25604248046875, 2.438232421875, 2.62042236328125, 2.8026123046875, 2.98480224609375, 3.1669921875, 3.34918212890625, 3.5313720703125, 3.71356201171875, 3.895751953125, 4.07794189453125, 4.2601318359375, 4.44232177734375, 4.62451171875, 4.80670166015625, 4.9888916015625, 5.17108154296875, 5.353271484375, 5.53546142578125, 5.7176513671875, 5.89984130859375, 6.08203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 5.0, 4.0, 7.0, 4.0, 7.0, 9.0, 8.0, 9.0, 10.0, 11.0, 20.0, 17.0, 13.0, 28.0, 26.0, 28.0, 42.0, 33.0, 36.0, 42.0, 44.0, 33.0, 36.0, 38.0, 32.0, 35.0, 31.0, 39.0, 44.0, 38.0, 41.0, 35.0, 28.0, 21.0, 25.0, 19.0, 15.0, 14.0, 9.0, 12.0, 18.0, 6.0, 5.0, 6.0, 8.0, 3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-1.916015625, -1.8549346923828125, -1.793853759765625, -1.7327728271484375, -1.67169189453125, -1.6106109619140625, -1.549530029296875, -1.4884490966796875, -1.4273681640625, -1.3662872314453125, -1.305206298828125, -1.2441253662109375, -1.18304443359375, -1.1219635009765625, -1.060882568359375, -0.9998016357421875, -0.938720703125, -0.8776397705078125, -0.816558837890625, -0.7554779052734375, -0.69439697265625, -0.6333160400390625, -0.572235107421875, -0.5111541748046875, -0.4500732421875, -0.3889923095703125, -0.327911376953125, -0.2668304443359375, -0.20574951171875, -0.1446685791015625, -0.083587646484375, -0.0225067138671875, 0.03857421875, 0.0996551513671875, 0.160736083984375, 0.2218170166015625, 0.28289794921875, 0.3439788818359375, 0.405059814453125, 0.4661407470703125, 0.5272216796875, 0.5883026123046875, 0.649383544921875, 0.7104644775390625, 0.77154541015625, 0.8326263427734375, 0.893707275390625, 0.9547882080078125, 1.015869140625, 1.0769500732421875, 1.138031005859375, 1.1991119384765625, 1.26019287109375, 1.3212738037109375, 1.382354736328125, 1.4434356689453125, 1.5045166015625, 1.5655975341796875, 1.626678466796875, 1.6877593994140625, 1.74884033203125, 1.8099212646484375, 1.871002197265625, 1.9320831298828125, 1.9931640625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 9.0, 7.0, 19.0, 26.0, 48.0, 61.0, 86.0, 169.0, 327.0, 766.0, 1695.0, 4989.0, 18542.0, 113749.0, 678536.0, 192128.0, 26865.0, 6600.0, 2127.0, 860.0, 391.0, 234.0, 110.0, 68.0, 47.0, 31.0, 17.0, 13.0, 11.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68603515625, -0.662872314453125, -0.63970947265625, -0.616546630859375, -0.5933837890625, -0.570220947265625, -0.54705810546875, -0.523895263671875, -0.500732421875, -0.477569580078125, -0.45440673828125, -0.431243896484375, -0.4080810546875, -0.384918212890625, -0.36175537109375, -0.338592529296875, -0.3154296875, -0.292266845703125, -0.26910400390625, -0.245941162109375, -0.2227783203125, -0.199615478515625, -0.17645263671875, -0.153289794921875, -0.130126953125, -0.106964111328125, -0.08380126953125, -0.060638427734375, -0.0374755859375, -0.014312744140625, 0.00885009765625, 0.032012939453125, 0.05517578125, 0.078338623046875, 0.10150146484375, 0.124664306640625, 0.1478271484375, 0.170989990234375, 0.19415283203125, 0.217315673828125, 0.240478515625, 0.263641357421875, 0.28680419921875, 0.309967041015625, 0.3331298828125, 0.356292724609375, 0.37945556640625, 0.402618408203125, 0.42578125, 0.448944091796875, 0.47210693359375, 0.495269775390625, 0.5184326171875, 0.541595458984375, 0.56475830078125, 0.587921142578125, 0.611083984375, 0.634246826171875, 0.65740966796875, 0.680572509765625, 0.7037353515625, 0.726898193359375, 0.75006103515625, 0.773223876953125, 0.79638671875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 8.0, 14.0, 27.0, 30.0, 27.0, 39.0, 66.0, 83.0, 86.0, 90.0, 113.0, 99.0, 61.0, 66.0, 40.0, 40.0, 26.0, 24.0, 17.0, 10.0, 11.0, 4.0, 8.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012195110321044922, -0.00011875759810209274, -0.00011556409299373627, -0.00011237058788537979, -0.00010917708277702332, -0.00010598357766866684, -0.00010279007256031036, -9.959656745195389e-05, -9.640306234359741e-05, -9.320955723524094e-05, -9.001605212688446e-05, -8.682254701852798e-05, -8.362904191017151e-05, -8.043553680181503e-05, -7.724203169345856e-05, -7.404852658510208e-05, -7.08550214767456e-05, -6.766151636838913e-05, -6.446801126003265e-05, -6.127450615167618e-05, -5.80810010433197e-05, -5.4887495934963226e-05, -5.169399082660675e-05, -4.8500485718250275e-05, -4.53069806098938e-05, -4.211347550153732e-05, -3.891997039318085e-05, -3.572646528482437e-05, -3.2532960176467896e-05, -2.933945506811142e-05, -2.6145949959754944e-05, -2.2952444851398468e-05, -1.9758939743041992e-05, -1.6565434634685516e-05, -1.337192952632904e-05, -1.0178424417972565e-05, -6.984919309616089e-06, -3.791414201259613e-06, -5.979090929031372e-07, 2.5955960154533386e-06, 5.7891011238098145e-06, 8.98260623216629e-06, 1.2176111340522766e-05, 1.5369616448879242e-05, 1.8563121557235718e-05, 2.1756626665592194e-05, 2.495013177394867e-05, 2.8143636882305145e-05, 3.133714199066162e-05, 3.45306470990181e-05, 3.772415220737457e-05, 4.091765731573105e-05, 4.4111162424087524e-05, 4.7304667532444e-05, 5.0498172640800476e-05, 5.369167774915695e-05, 5.688518285751343e-05, 6.0078687965869904e-05, 6.327219307422638e-05, 6.646569818258286e-05, 6.965920329093933e-05, 7.285270839929581e-05, 7.604621350765228e-05, 7.923971861600876e-05, 8.243322372436523e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 7.0, 10.0, 8.0, 11.0, 10.0, 19.0, 21.0, 56.0, 94.0, 141.0, 338.0, 593.0, 1333.0, 3280.0, 9701.0, 36166.0, 192469.0, 603476.0, 156517.0, 30506.0, 8534.0, 2964.0, 1200.0, 513.0, 246.0, 138.0, 66.0, 50.0, 34.0, 18.0, 13.0, 9.0, 5.0, 0.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.537109375, -0.5188674926757812, -0.5006256103515625, -0.48238372802734375, -0.464141845703125, -0.44589996337890625, -0.4276580810546875, -0.40941619873046875, -0.39117431640625, -0.37293243408203125, -0.3546905517578125, -0.33644866943359375, -0.318206787109375, -0.29996490478515625, -0.2817230224609375, -0.26348114013671875, -0.2452392578125, -0.22699737548828125, -0.2087554931640625, -0.19051361083984375, -0.172271728515625, -0.15402984619140625, -0.1357879638671875, -0.11754608154296875, -0.09930419921875, -0.08106231689453125, -0.0628204345703125, -0.04457855224609375, -0.026336669921875, -0.00809478759765625, 0.0101470947265625, 0.02838897705078125, 0.046630859375, 0.06487274169921875, 0.0831146240234375, 0.10135650634765625, 0.119598388671875, 0.13784027099609375, 0.1560821533203125, 0.17432403564453125, 0.19256591796875, 0.21080780029296875, 0.2290496826171875, 0.24729156494140625, 0.265533447265625, 0.28377532958984375, 0.3020172119140625, 0.32025909423828125, 0.3385009765625, 0.35674285888671875, 0.3749847412109375, 0.39322662353515625, 0.411468505859375, 0.42971038818359375, 0.4479522705078125, 0.46619415283203125, 0.48443603515625, 0.5026779174804688, 0.5209197998046875, 0.5391616821289062, 0.557403564453125, 0.5756454467773438, 0.5938873291015625, 0.6121292114257812, 0.63037109375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 8.0, 6.0, 7.0, 8.0, 14.0, 18.0, 13.0, 22.0, 30.0, 35.0, 36.0, 34.0, 30.0, 61.0, 53.0, 52.0, 64.0, 69.0, 62.0, 63.0, 53.0, 43.0, 33.0, 30.0, 25.0, 25.0, 17.0, 13.0, 10.0, 9.0, 11.0, 8.0, 5.0, 6.0, 3.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.2431640625, -0.23656272888183594, -0.22996139526367188, -0.2233600616455078, -0.21675872802734375, -0.2101573944091797, -0.20355606079101562, -0.19695472717285156, -0.1903533935546875, -0.18375205993652344, -0.17715072631835938, -0.1705493927001953, -0.16394805908203125, -0.1573467254638672, -0.15074539184570312, -0.14414405822753906, -0.137542724609375, -0.13094139099121094, -0.12434005737304688, -0.11773872375488281, -0.11113739013671875, -0.10453605651855469, -0.09793472290039062, -0.09133338928222656, -0.0847320556640625, -0.07813072204589844, -0.07152938842773438, -0.06492805480957031, -0.05832672119140625, -0.05172538757324219, -0.045124053955078125, -0.03852272033691406, -0.03192138671875, -0.025320053100585938, -0.018718719482421875, -0.012117385864257812, -0.00551605224609375, 0.0010852813720703125, 0.007686614990234375, 0.014287948608398438, 0.0208892822265625, 0.027490615844726562, 0.034091949462890625, 0.04069328308105469, 0.04729461669921875, 0.05389595031738281, 0.060497283935546875, 0.06709861755371094, 0.073699951171875, 0.08030128479003906, 0.08690261840820312, 0.09350395202636719, 0.10010528564453125, 0.10670661926269531, 0.11330795288085938, 0.11990928649902344, 0.1265106201171875, 0.13311195373535156, 0.13971328735351562, 0.1463146209716797, 0.15291595458984375, 0.1595172882080078, 0.16611862182617188, 0.17271995544433594, 0.1793212890625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 12.0, 26.0, 84.0, 316.0, 408.0, 110.0, 23.0, 17.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.892582893371582, -6.437861442565918, -5.983140468597412, -5.528419494628906, -5.073698043823242, -4.618976593017578, -4.164255619049072, -3.7095344066619873, -3.2548131942749023, -2.8000919818878174, -2.3453707695007324, -1.8906495571136475, -1.4359283447265625, -0.9812071323394775, -0.5264859199523926, -0.07176470756530762, 0.38295650482177734, 0.8376777172088623, 1.2923989295959473, 1.7471201419830322, 2.201841354370117, 2.656562566757202, 3.111283779144287, 3.566004991531372, 4.020726203918457, 4.475447654724121, 4.930168628692627, 5.384889602661133, 5.839611053466797, 6.294332504272461, 6.749053478240967, 7.203774452209473, 7.65849494934082, 8.113216400146484, 8.567937850952148, 9.022658348083496, 9.47737979888916, 9.932101249694824, 10.386821746826172, 10.841543197631836, 11.2962646484375, 11.750986099243164, 12.205707550048828, 12.660428047180176, 13.11514949798584, 13.569870948791504, 14.024591445922852, 14.479312896728516, 14.93403434753418, 15.388755798339844, 15.843477249145508, 16.298198699951172, 16.752918243408203, 17.207639694213867, 17.66236114501953, 18.117082595825195, 18.57180404663086, 19.026525497436523, 19.481246948242188, 19.93596839904785, 20.390689849853516, 20.845409393310547, 21.30013084411621, 21.754852294921875, 22.20957374572754]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 4.0, 7.0, 6.0, 7.0, 8.0, 15.0, 16.0, 11.0, 20.0, 28.0, 45.0, 40.0, 47.0, 47.0, 50.0, 74.0, 56.0, 48.0, 59.0, 55.0, 41.0, 53.0, 26.0, 33.0, 36.0, 31.0, 31.0, 22.0, 23.0, 12.0, 12.0, 8.0, 6.0, 5.0, 10.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.718438625335693, -4.575350284576416, -4.432262420654297, -4.2891740798950195, -4.1460862159729, -4.002997875213623, -3.859910011291504, -3.7168216705322266, -3.5737338066101074, -3.430645704269409, -3.287557601928711, -3.1444694995880127, -3.0013813972473145, -2.858293294906616, -2.715205192565918, -2.5721168518066406, -2.4290287494659424, -2.285940647125244, -2.142852544784546, -1.9997644424438477, -1.8566763401031494, -1.7135882377624512, -1.5705000162124634, -1.4274119138717651, -1.284323811531067, -1.1412357091903687, -0.9981476068496704, -0.8550594449043274, -0.7119713425636292, -0.5688832402229309, -0.4257950782775879, -0.28270697593688965, -0.1396188735961914, 0.00346924364566803, 0.14655736088752747, 0.2896454930305481, 0.43273359537124634, 0.5758216977119446, 0.7189098596572876, 0.8619979619979858, 1.005086064338684, 1.1481741666793823, 1.2912622690200806, 1.4343504905700684, 1.5774385929107666, 1.7205266952514648, 1.863614797592163, 2.0067028999328613, 2.1497910022735596, 2.292879104614258, 2.435967206954956, 2.5790553092956543, 2.7221434116363525, 2.865231513977051, 3.008319854736328, 3.1514077186584473, 3.2944960594177246, 3.437584161758423, 3.580672264099121, 3.7237603664398193, 3.8668484687805176, 4.009936809539795, 4.153024673461914, 4.296113014221191, 4.4392008781433105]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 2.0, 9.0, 15.0, 15.0, 21.0, 18.0, 40.0, 43.0, 62.0, 103.0, 155.0, 207.0, 338.0, 591.0, 945.0, 1554.0, 3141.0, 6169.0, 13902.0, 35616.0, 118622.0, 730840.0, 2865417.0, 302421.0, 69202.0, 24076.0, 10072.0, 4760.0, 2445.0, 1361.0, 718.0, 454.0, 336.0, 196.0, 126.0, 81.0, 59.0, 37.0, 25.0, 27.0, 19.0, 12.0, 9.0, 5.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.544921875, -1.493927001953125, -1.44293212890625, -1.391937255859375, -1.3409423828125, -1.289947509765625, -1.23895263671875, -1.187957763671875, -1.136962890625, -1.085968017578125, -1.03497314453125, -0.983978271484375, -0.9329833984375, -0.881988525390625, -0.83099365234375, -0.779998779296875, -0.72900390625, -0.678009033203125, -0.62701416015625, -0.576019287109375, -0.5250244140625, -0.474029541015625, -0.42303466796875, -0.372039794921875, -0.321044921875, -0.270050048828125, -0.21905517578125, -0.168060302734375, -0.1170654296875, -0.066070556640625, -0.01507568359375, 0.035919189453125, 0.0869140625, 0.137908935546875, 0.18890380859375, 0.239898681640625, 0.2908935546875, 0.341888427734375, 0.39288330078125, 0.443878173828125, 0.494873046875, 0.545867919921875, 0.59686279296875, 0.647857666015625, 0.6988525390625, 0.749847412109375, 0.80084228515625, 0.851837158203125, 0.90283203125, 0.953826904296875, 1.00482177734375, 1.055816650390625, 1.1068115234375, 1.157806396484375, 1.20880126953125, 1.259796142578125, 1.310791015625, 1.361785888671875, 1.41278076171875, 1.463775634765625, 1.5147705078125, 1.565765380859375, 1.61676025390625, 1.667755126953125, 1.71875]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 6.0, 5.0, 5.0, 12.0, 17.0, 8.0, 21.0, 25.0, 32.0, 39.0, 52.0, 62.0, 56.0, 92.0, 89.0, 74.0, 73.0, 69.0, 50.0, 54.0, 33.0, 32.0, 22.0, 15.0, 10.0, 5.0, 10.0, 7.0, 7.0, 1.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.81640625, -1.7609100341796875, -1.705413818359375, -1.6499176025390625, -1.59442138671875, -1.5389251708984375, -1.483428955078125, -1.4279327392578125, -1.3724365234375, -1.3169403076171875, -1.261444091796875, -1.2059478759765625, -1.15045166015625, -1.0949554443359375, -1.039459228515625, -0.9839630126953125, -0.928466796875, -0.8729705810546875, -0.817474365234375, -0.7619781494140625, -0.70648193359375, -0.6509857177734375, -0.595489501953125, -0.5399932861328125, -0.4844970703125, -0.4290008544921875, -0.373504638671875, -0.3180084228515625, -0.26251220703125, -0.2070159912109375, -0.151519775390625, -0.0960235595703125, -0.04052734375, 0.0149688720703125, 0.070465087890625, 0.1259613037109375, 0.18145751953125, 0.2369537353515625, 0.292449951171875, 0.3479461669921875, 0.4034423828125, 0.4589385986328125, 0.514434814453125, 0.5699310302734375, 0.62542724609375, 0.6809234619140625, 0.736419677734375, 0.7919158935546875, 0.847412109375, 0.9029083251953125, 0.958404541015625, 1.0139007568359375, 1.06939697265625, 1.1248931884765625, 1.180389404296875, 1.2358856201171875, 1.2913818359375, 1.3468780517578125, 1.402374267578125, 1.4578704833984375, 1.51336669921875, 1.5688629150390625, 1.624359130859375, 1.6798553466796875, 1.7353515625]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 8.0, 6.0, 7.0, 13.0, 16.0, 19.0, 37.0, 45.0, 73.0, 132.0, 262.0, 779.0, 3527.0, 52043.0, 4013439.0, 116741.0, 5436.0, 978.0, 325.0, 163.0, 74.0, 53.0, 28.0, 18.0, 18.0, 11.0, 15.0, 4.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.78125, -5.60919189453125, -5.4371337890625, -5.26507568359375, -5.093017578125, -4.92095947265625, -4.7489013671875, -4.57684326171875, -4.40478515625, -4.23272705078125, -4.0606689453125, -3.88861083984375, -3.716552734375, -3.54449462890625, -3.3724365234375, -3.20037841796875, -3.0283203125, -2.85626220703125, -2.6842041015625, -2.51214599609375, -2.340087890625, -2.16802978515625, -1.9959716796875, -1.82391357421875, -1.65185546875, -1.47979736328125, -1.3077392578125, -1.13568115234375, -0.963623046875, -0.79156494140625, -0.6195068359375, -0.44744873046875, -0.275390625, -0.10333251953125, 0.0687255859375, 0.24078369140625, 0.412841796875, 0.58489990234375, 0.7569580078125, 0.92901611328125, 1.10107421875, 1.27313232421875, 1.4451904296875, 1.61724853515625, 1.789306640625, 1.96136474609375, 2.1334228515625, 2.30548095703125, 2.4775390625, 2.64959716796875, 2.8216552734375, 2.99371337890625, 3.165771484375, 3.33782958984375, 3.5098876953125, 3.68194580078125, 3.85400390625, 4.02606201171875, 4.1981201171875, 4.37017822265625, 4.542236328125, 4.71429443359375, 4.8863525390625, 5.05841064453125, 5.23046875]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 3.0, 3.0, 8.0, 7.0, 9.0, 10.0, 26.0, 26.0, 34.0, 56.0, 83.0, 92.0, 182.0, 252.0, 498.0, 1015.0, 748.0, 349.0, 216.0, 124.0, 106.0, 59.0, 51.0, 31.0, 17.0, 14.0, 13.0, 15.0, 5.0, 9.0, 4.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.464599609375, -0.4458808898925781, -0.42716217041015625, -0.4084434509277344, -0.3897247314453125, -0.3710060119628906, -0.35228729248046875, -0.3335685729980469, -0.314849853515625, -0.2961311340332031, -0.27741241455078125, -0.2586936950683594, -0.2399749755859375, -0.22125625610351562, -0.20253753662109375, -0.18381881713867188, -0.16510009765625, -0.14638137817382812, -0.12766265869140625, -0.10894393920898438, -0.0902252197265625, -0.07150650024414062, -0.05278778076171875, -0.034069061279296875, -0.015350341796875, 0.003368377685546875, 0.02208709716796875, 0.040805816650390625, 0.0595245361328125, 0.07824325561523438, 0.09696197509765625, 0.11568069458007812, 0.1343994140625, 0.15311813354492188, 0.17183685302734375, 0.19055557250976562, 0.2092742919921875, 0.22799301147460938, 0.24671173095703125, 0.2654304504394531, 0.284149169921875, 0.3028678894042969, 0.32158660888671875, 0.3403053283691406, 0.3590240478515625, 0.3777427673339844, 0.39646148681640625, 0.4151802062988281, 0.43389892578125, 0.4526176452636719, 0.47133636474609375, 0.4900550842285156, 0.5087738037109375, 0.5274925231933594, 0.5462112426757812, 0.5649299621582031, 0.583648681640625, 0.6023674011230469, 0.6210861206054688, 0.6398048400878906, 0.6585235595703125, 0.6772422790527344, 0.6959609985351562, 0.7146797180175781, 0.7333984375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 13.0, 9.0, 19.0, 46.0, 74.0, 145.0, 259.0, 212.0, 110.0, 48.0, 23.0, 17.0, 17.0, 8.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3715057373046875, -5.207652568817139, -5.04379940032959, -4.879946231842041, -4.716093063354492, -4.552239894866943, -4.3883867263793945, -4.224533557891846, -4.060680389404297, -3.896827220916748, -3.732974052429199, -3.5691208839416504, -3.4052677154541016, -3.2414145469665527, -3.077561378479004, -2.913708209991455, -2.7498550415039062, -2.5860018730163574, -2.4221487045288086, -2.2582955360412598, -2.094442367553711, -1.930589199066162, -1.7667360305786133, -1.6028828620910645, -1.4390296936035156, -1.2751765251159668, -1.111323356628418, -0.9474701881408691, -0.7836170196533203, -0.6197638511657715, -0.45591068267822266, -0.29205751419067383, -0.1282038688659668, 0.03564929962158203, 0.19950246810913086, 0.3633556365966797, 0.5272088050842285, 0.6910619735717773, 0.8549151420593262, 1.018768310546875, 1.1826214790344238, 1.3464746475219727, 1.5103278160095215, 1.6741809844970703, 1.8380341529846191, 2.001887321472168, 2.165740489959717, 2.3295936584472656, 2.4934468269348145, 2.6572999954223633, 2.821153163909912, 2.985006332397461, 3.1488595008850098, 3.3127126693725586, 3.4765658378601074, 3.6404190063476562, 3.804272174835205, 3.968125343322754, 4.131978511810303, 4.295831680297852, 4.4596848487854, 4.623538017272949, 4.787391185760498, 4.951244354248047, 5.115097522735596]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 9.0, 5.0, 8.0, 8.0, 9.0, 22.0, 25.0, 35.0, 46.0, 41.0, 41.0, 44.0, 72.0, 60.0, 78.0, 62.0, 59.0, 76.0, 51.0, 59.0, 48.0, 28.0, 24.0, 20.0, 17.0, 12.0, 10.0, 9.0, 4.0, 4.0, 4.0, 1.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.118955135345459, -2.05656099319458, -1.9941670894622803, -1.9317729473114014, -1.869378924369812, -1.8069849014282227, -1.7445908784866333, -1.682196855545044, -1.6198028326034546, -1.5574088096618652, -1.4950147867202759, -1.4326207637786865, -1.3702266216278076, -1.3078325986862183, -1.245438575744629, -1.1830445528030396, -1.1206505298614502, -1.0582565069198608, -0.9958624243736267, -0.9334684014320374, -0.871074378490448, -0.8086802959442139, -0.7462862730026245, -0.6838922500610352, -0.6214981079101562, -0.5591040849685669, -0.49671003222465515, -0.4343159794807434, -0.37192195653915405, -0.3095279037952423, -0.24713385105133057, -0.1847398281097412, -0.12234580516815186, -0.05995176360011101, 0.00244227796792984, 0.06483632326126099, 0.12723036110401154, 0.18962439894676208, 0.25201845169067383, 0.3144124746322632, 0.3768065273761749, 0.43920058012008667, 0.501594603061676, 0.5639886856079102, 0.6263827085494995, 0.6887767314910889, 0.7511707544326782, 0.8135647773742676, 0.8759588599205017, 0.9383528828620911, 1.0007469654083252, 1.0631409883499146, 1.125535011291504, 1.1879290342330933, 1.2503230571746826, 1.3127171993255615, 1.3751112222671509, 1.4375052452087402, 1.4998992681503296, 1.562293291091919, 1.6246874332427979, 1.6870814561843872, 1.7494754791259766, 1.811869502067566, 1.8742635250091553]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 2.0, 4.0, 8.0, 6.0, 7.0, 16.0, 18.0, 28.0, 43.0, 68.0, 83.0, 166.0, 299.0, 625.0, 1354.0, 3629.0, 11930.0, 59285.0, 606501.0, 316325.0, 35193.0, 8148.0, 2600.0, 1076.0, 472.0, 267.0, 117.0, 95.0, 61.0, 39.0, 26.0, 18.0, 14.0, 11.0, 4.0, 6.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177734375, -0.17111587524414062, -0.16449737548828125, -0.15787887573242188, -0.1512603759765625, -0.14464187622070312, -0.13802337646484375, -0.13140487670898438, -0.124786376953125, -0.11816787719726562, -0.11154937744140625, -0.10493087768554688, -0.0983123779296875, -0.09169387817382812, -0.08507537841796875, -0.07845687866210938, -0.07183837890625, -0.06521987915039062, -0.05860137939453125, -0.051982879638671875, -0.0453643798828125, -0.038745880126953125, -0.03212738037109375, -0.025508880615234375, -0.018890380859375, -0.012271881103515625, -0.00565338134765625, 0.000965118408203125, 0.0075836181640625, 0.014202117919921875, 0.02082061767578125, 0.027439117431640625, 0.0340576171875, 0.040676116943359375, 0.04729461669921875, 0.053913116455078125, 0.0605316162109375, 0.06715011596679688, 0.07376861572265625, 0.08038711547851562, 0.087005615234375, 0.09362411499023438, 0.10024261474609375, 0.10686111450195312, 0.1134796142578125, 0.12009811401367188, 0.12671661376953125, 0.13333511352539062, 0.13995361328125, 0.14657211303710938, 0.15319061279296875, 0.15980911254882812, 0.1664276123046875, 0.17304611206054688, 0.17966461181640625, 0.18628311157226562, 0.192901611328125, 0.19952011108398438, 0.20613861083984375, 0.21275711059570312, 0.2193756103515625, 0.22599411010742188, 0.23261260986328125, 0.23923110961914062, 0.245849609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 5.0, 6.0, 14.0, 12.0, 17.0, 13.0, 35.0, 36.0, 41.0, 59.0, 53.0, 67.0, 70.0, 89.0, 73.0, 74.0, 66.0, 60.0, 47.0, 33.0, 25.0, 24.0, 15.0, 11.0, 7.0, 8.0, 9.0, 3.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.6494140625, -1.6045074462890625, -1.559600830078125, -1.5146942138671875, -1.46978759765625, -1.4248809814453125, -1.379974365234375, -1.3350677490234375, -1.2901611328125, -1.2452545166015625, -1.200347900390625, -1.1554412841796875, -1.11053466796875, -1.0656280517578125, -1.020721435546875, -0.9758148193359375, -0.930908203125, -0.8860015869140625, -0.841094970703125, -0.7961883544921875, -0.75128173828125, -0.7063751220703125, -0.661468505859375, -0.6165618896484375, -0.5716552734375, -0.5267486572265625, -0.481842041015625, -0.4369354248046875, -0.39202880859375, -0.3471221923828125, -0.302215576171875, -0.2573089599609375, -0.21240234375, -0.1674957275390625, -0.122589111328125, -0.0776824951171875, -0.03277587890625, 0.0121307373046875, 0.057037353515625, 0.1019439697265625, 0.1468505859375, 0.1917572021484375, 0.236663818359375, 0.2815704345703125, 0.32647705078125, 0.3713836669921875, 0.416290283203125, 0.4611968994140625, 0.506103515625, 0.5510101318359375, 0.595916748046875, 0.6408233642578125, 0.68572998046875, 0.7306365966796875, 0.775543212890625, 0.8204498291015625, 0.8653564453125, 0.9102630615234375, 0.955169677734375, 1.0000762939453125, 1.04498291015625, 1.0898895263671875, 1.134796142578125, 1.1797027587890625, 1.224609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 11.0, 13.0, 3.0, 12.0, 12.0, 16.0, 31.0, 28.0, 27.0, 49.0, 57.0, 103.0, 136.0, 188.0, 347.0, 785.0, 3073.0, 18953.0, 235451.0, 720664.0, 58752.0, 7064.0, 1444.0, 486.0, 246.0, 155.0, 130.0, 71.0, 44.0, 52.0, 37.0, 30.0, 20.0, 13.0, 12.0, 8.0, 3.0, 8.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1561279296875, -0.15039825439453125, -0.1446685791015625, -0.13893890380859375, -0.133209228515625, -0.12747955322265625, -0.1217498779296875, -0.11602020263671875, -0.11029052734375, -0.10456085205078125, -0.0988311767578125, -0.09310150146484375, -0.087371826171875, -0.08164215087890625, -0.0759124755859375, -0.07018280029296875, -0.064453125, -0.05872344970703125, -0.0529937744140625, -0.04726409912109375, -0.041534423828125, -0.03580474853515625, -0.0300750732421875, -0.02434539794921875, -0.01861572265625, -0.01288604736328125, -0.0071563720703125, -0.00142669677734375, 0.004302978515625, 0.01003265380859375, 0.0157623291015625, 0.02149200439453125, 0.0272216796875, 0.03295135498046875, 0.0386810302734375, 0.04441070556640625, 0.050140380859375, 0.05587005615234375, 0.0615997314453125, 0.06732940673828125, 0.07305908203125, 0.07878875732421875, 0.0845184326171875, 0.09024810791015625, 0.095977783203125, 0.10170745849609375, 0.1074371337890625, 0.11316680908203125, 0.118896484375, 0.12462615966796875, 0.1303558349609375, 0.13608551025390625, 0.141815185546875, 0.14754486083984375, 0.1532745361328125, 0.15900421142578125, 0.16473388671875, 0.17046356201171875, 0.1761932373046875, 0.18192291259765625, 0.187652587890625, 0.19338226318359375, 0.1991119384765625, 0.20484161376953125, 0.2105712890625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 4.0, 4.0, 3.0, 7.0, 6.0, 6.0, 6.0, 11.0, 13.0, 12.0, 18.0, 16.0, 12.0, 15.0, 30.0, 35.0, 38.0, 24.0, 40.0, 49.0, 57.0, 61.0, 57.0, 51.0, 42.0, 48.0, 42.0, 24.0, 33.0, 35.0, 29.0, 27.0, 23.0, 24.0, 24.0, 13.0, 14.0, 13.0, 12.0, 5.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.646484375, -1.5917816162109375, -1.537078857421875, -1.4823760986328125, -1.42767333984375, -1.3729705810546875, -1.318267822265625, -1.2635650634765625, -1.2088623046875, -1.1541595458984375, -1.099456787109375, -1.0447540283203125, -0.99005126953125, -0.9353485107421875, -0.880645751953125, -0.8259429931640625, -0.771240234375, -0.7165374755859375, -0.661834716796875, -0.6071319580078125, -0.55242919921875, -0.4977264404296875, -0.443023681640625, -0.3883209228515625, -0.3336181640625, -0.2789154052734375, -0.224212646484375, -0.1695098876953125, -0.11480712890625, -0.0601043701171875, -0.005401611328125, 0.0493011474609375, 0.10400390625, 0.1587066650390625, 0.213409423828125, 0.2681121826171875, 0.32281494140625, 0.3775177001953125, 0.432220458984375, 0.4869232177734375, 0.5416259765625, 0.5963287353515625, 0.651031494140625, 0.7057342529296875, 0.76043701171875, 0.8151397705078125, 0.869842529296875, 0.9245452880859375, 0.979248046875, 1.0339508056640625, 1.088653564453125, 1.1433563232421875, 1.19805908203125, 1.2527618408203125, 1.307464599609375, 1.3621673583984375, 1.4168701171875, 1.4715728759765625, 1.526275634765625, 1.5809783935546875, 1.63568115234375, 1.6903839111328125, 1.745086669921875, 1.7997894287109375, 1.8544921875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 7.0, 4.0, 2.0, 7.0, 4.0, 12.0, 13.0, 15.0, 25.0, 35.0, 37.0, 71.0, 136.0, 266.0, 914.0, 6450.0, 927073.0, 109246.0, 3126.0, 604.0, 219.0, 88.0, 57.0, 43.0, 29.0, 26.0, 15.0, 8.0, 6.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.088623046875, -0.08607959747314453, -0.08353614807128906, -0.0809926986694336, -0.07844924926757812, -0.07590579986572266, -0.07336235046386719, -0.07081890106201172, -0.06827545166015625, -0.06573200225830078, -0.06318855285644531, -0.060645103454589844, -0.058101654052734375, -0.055558204650878906, -0.05301475524902344, -0.05047130584716797, -0.0479278564453125, -0.04538440704345703, -0.04284095764160156, -0.040297508239746094, -0.037754058837890625, -0.035210609436035156, -0.03266716003417969, -0.03012371063232422, -0.02758026123046875, -0.02503681182861328, -0.022493362426757812, -0.019949913024902344, -0.017406463623046875, -0.014863014221191406, -0.012319564819335938, -0.009776115417480469, -0.007232666015625, -0.004689216613769531, -0.0021457672119140625, 0.00039768218994140625, 0.002941131591796875, 0.005484580993652344, 0.008028030395507812, 0.010571479797363281, 0.01311492919921875, 0.01565837860107422, 0.018201828002929688, 0.020745277404785156, 0.023288726806640625, 0.025832176208496094, 0.028375625610351562, 0.03091907501220703, 0.0334625244140625, 0.03600597381591797, 0.03854942321777344, 0.041092872619628906, 0.043636322021484375, 0.046179771423339844, 0.04872322082519531, 0.05126667022705078, 0.05381011962890625, 0.05635356903076172, 0.05889701843261719, 0.061440467834472656, 0.06398391723632812, 0.0665273666381836, 0.06907081604003906, 0.07161426544189453, 0.07415771484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 6.0, 5.0, 4.0, 9.0, 15.0, 23.0, 13.0, 32.0, 44.0, 68.0, 93.0, 120.0, 99.0, 134.0, 91.0, 70.0, 46.0, 32.0, 28.0, 16.0, 9.0, 12.0, 6.0, 7.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8358230590820312e-05, -1.7780810594558716e-05, -1.720339059829712e-05, -1.6625970602035522e-05, -1.6048550605773926e-05, -1.547113060951233e-05, -1.4893710613250732e-05, -1.4316290616989136e-05, -1.3738870620727539e-05, -1.3161450624465942e-05, -1.2584030628204346e-05, -1.2006610631942749e-05, -1.1429190635681152e-05, -1.0851770639419556e-05, -1.0274350643157959e-05, -9.696930646896362e-06, -9.119510650634766e-06, -8.542090654373169e-06, -7.964670658111572e-06, -7.387250661849976e-06, -6.809830665588379e-06, -6.232410669326782e-06, -5.6549906730651855e-06, -5.077570676803589e-06, -4.500150680541992e-06, -3.9227306842803955e-06, -3.345310688018799e-06, -2.767890691757202e-06, -2.1904706954956055e-06, -1.6130506992340088e-06, -1.0356307029724121e-06, -4.5821070671081543e-07, 1.1920928955078125e-07, 6.966292858123779e-07, 1.2740492820739746e-06, 1.8514692783355713e-06, 2.428889274597168e-06, 3.0063092708587646e-06, 3.5837292671203613e-06, 4.161149263381958e-06, 4.738569259643555e-06, 5.315989255905151e-06, 5.893409252166748e-06, 6.470829248428345e-06, 7.048249244689941e-06, 7.625669240951538e-06, 8.203089237213135e-06, 8.780509233474731e-06, 9.357929229736328e-06, 9.935349225997925e-06, 1.0512769222259521e-05, 1.1090189218521118e-05, 1.1667609214782715e-05, 1.2245029211044312e-05, 1.2822449207305908e-05, 1.3399869203567505e-05, 1.3977289199829102e-05, 1.4554709196090698e-05, 1.5132129192352295e-05, 1.570954918861389e-05, 1.6286969184875488e-05, 1.6864389181137085e-05, 1.744180917739868e-05, 1.801922917366028e-05, 1.8596649169921875e-05]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 11.0, 11.0, 23.0, 22.0, 49.0, 89.0, 139.0, 301.0, 696.0, 2064.0, 9789.0, 355052.0, 665197.0, 11531.0, 2176.0, 716.0, 320.0, 166.0, 80.0, 51.0, 20.0, 15.0, 8.0, 8.0, 6.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08935546875, -0.08680534362792969, -0.08425521850585938, -0.08170509338378906, -0.07915496826171875, -0.07660484313964844, -0.07405471801757812, -0.07150459289550781, -0.0689544677734375, -0.06640434265136719, -0.06385421752929688, -0.06130409240722656, -0.05875396728515625, -0.05620384216308594, -0.053653717041015625, -0.05110359191894531, -0.048553466796875, -0.04600334167480469, -0.043453216552734375, -0.04090309143066406, -0.03835296630859375, -0.03580284118652344, -0.033252716064453125, -0.030702590942382812, -0.0281524658203125, -0.025602340698242188, -0.023052215576171875, -0.020502090454101562, -0.01795196533203125, -0.015401840209960938, -0.012851715087890625, -0.010301589965820312, -0.00775146484375, -0.0052013397216796875, -0.002651214599609375, -0.0001010894775390625, 0.00244903564453125, 0.0049991607666015625, 0.007549285888671875, 0.010099411010742188, 0.0126495361328125, 0.015199661254882812, 0.017749786376953125, 0.020299911499023438, 0.02285003662109375, 0.025400161743164062, 0.027950286865234375, 0.030500411987304688, 0.033050537109375, 0.03560066223144531, 0.038150787353515625, 0.04070091247558594, 0.04325103759765625, 0.04580116271972656, 0.048351287841796875, 0.05090141296386719, 0.0534515380859375, 0.05600166320800781, 0.058551788330078125, 0.06110191345214844, 0.06365203857421875, 0.06620216369628906, 0.06875228881835938, 0.07130241394042969, 0.0738525390625]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 5.0, 3.0, 11.0, 22.0, 48.0, 213.0, 486.0, 125.0, 36.0, 17.0, 5.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0174560546875, -0.016898632049560547, -0.016341209411621094, -0.01578378677368164, -0.015226364135742188, -0.014668941497802734, -0.014111518859863281, -0.013554096221923828, -0.012996673583984375, -0.012439250946044922, -0.011881828308105469, -0.011324405670166016, -0.010766983032226562, -0.01020956039428711, -0.009652137756347656, -0.009094715118408203, -0.00853729248046875, -0.007979869842529297, -0.007422447204589844, -0.006865024566650391, -0.0063076019287109375, -0.005750179290771484, -0.005192756652832031, -0.004635334014892578, -0.004077911376953125, -0.003520488739013672, -0.0029630661010742188, -0.0024056434631347656, -0.0018482208251953125, -0.0012907981872558594, -0.0007333755493164062, -0.00017595291137695312, 0.0003814697265625, 0.0009388923645019531, 0.0014963150024414062, 0.0020537376403808594, 0.0026111602783203125, 0.0031685829162597656, 0.0037260055541992188, 0.004283428192138672, 0.004840850830078125, 0.005398273468017578, 0.005955696105957031, 0.006513118743896484, 0.0070705413818359375, 0.007627964019775391, 0.008185386657714844, 0.008742809295654297, 0.00930023193359375, 0.009857654571533203, 0.010415077209472656, 0.01097249984741211, 0.011529922485351562, 0.012087345123291016, 0.012644767761230469, 0.013202190399169922, 0.013759613037109375, 0.014317035675048828, 0.014874458312988281, 0.015431880950927734, 0.015989303588867188, 0.01654672622680664, 0.017104148864746094, 0.017661571502685547, 0.018218994140625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 14.0, 10.0, 32.0, 75.0, 165.0, 317.0, 228.0, 80.0, 27.0, 20.0, 20.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.034088611602783, -3.902669668197632, -3.7712504863739014, -3.63983154296875, -3.5084123611450195, -3.376993417739868, -3.245574474334717, -3.1141552925109863, -2.982736349105835, -2.8513174057006836, -2.719898223876953, -2.5884792804718018, -2.4570603370666504, -2.32564115524292, -2.1942222118377686, -2.062803268432617, -1.9313840866088867, -1.7999650239944458, -1.6685459613800049, -1.5371270179748535, -1.4057079553604126, -1.2742888927459717, -1.1428699493408203, -1.0114508867263794, -0.8800318241119385, -0.7486127614974976, -0.6171937584877014, -0.4857747256755829, -0.35435569286346436, -0.22293663024902344, -0.0915176272392273, 0.03990137577056885, 0.17132043838500977, 0.3027394711971283, 0.4341585040092468, 0.565577507019043, 0.6969965696334839, 0.8284156322479248, 0.959834635257721, 1.091253638267517, 1.222672700881958, 1.354091763496399, 1.4855108261108398, 1.6169297695159912, 1.7483488321304321, 1.879767894744873, 2.0111868381500244, 2.142605781555176, 2.2740249633789062, 2.4054439067840576, 2.536863088607788, 2.6682820320129395, 2.79970121383667, 2.9311201572418213, 3.0625391006469727, 3.193958282470703, 3.3253772258758545, 3.456796169281006, 3.5882153511047363, 3.7196342945098877, 3.851053237915039, 3.9824724197387695, 4.1138916015625, 4.245310306549072, 4.376729488372803]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 2.0, 5.0, 2.0, 5.0, 5.0, 10.0, 7.0, 19.0, 19.0, 31.0, 42.0, 47.0, 47.0, 62.0, 81.0, 79.0, 88.0, 79.0, 86.0, 57.0, 60.0, 51.0, 23.0, 28.0, 14.0, 11.0, 10.0, 5.0, 9.0, 4.0, 4.0, 2.0, 3.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6598905324935913, -1.6129984855651855, -1.5661065578460693, -1.5192145109176636, -1.4723224639892578, -1.4254305362701416, -1.3785384893417358, -1.33164644241333, -1.2847545146942139, -1.237862467765808, -1.190970540046692, -1.1440784931182861, -1.09718656539917, -1.0502945184707642, -1.0034024715423584, -0.9565104842185974, -0.9096184968948364, -0.8627265095710754, -0.8158345222473145, -0.7689424753189087, -0.7220504879951477, -0.6751585006713867, -0.628266453742981, -0.58137446641922, -0.534482479095459, -0.487590491771698, -0.4406984746456146, -0.39380645751953125, -0.34691447019577026, -0.3000224828720093, -0.2531304657459259, -0.20623844861984253, -0.159346342086792, -0.11245433986186981, -0.06556233763694763, -0.01867033541202545, 0.02822166681289673, 0.07511366903781891, 0.12200567126274109, 0.16889768838882446, 0.21578967571258545, 0.26268166303634644, 0.3095736801624298, 0.3564656972885132, 0.40335768461227417, 0.45024967193603516, 0.49714168906211853, 0.5440337061882019, 0.5909256935119629, 0.6378176808357239, 0.6847096681594849, 0.7316017150878906, 0.7784937024116516, 0.8253856897354126, 0.8722777366638184, 0.9191697239875793, 0.9660617113113403, 1.012953758239746, 1.0598456859588623, 1.106737732887268, 1.1536297798156738, 1.20052170753479, 1.2474137544631958, 1.2943058013916016, 1.3411977291107178]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 12.0, 3.0, 18.0, 23.0, 40.0, 85.0, 169.0, 496.0, 1487.0, 7955.0, 125603.0, 865285.0, 41397.0, 4403.0, 976.0, 311.0, 146.0, 51.0, 33.0, 18.0, 14.0, 10.0, 4.0, 7.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.65625, -3.5316162109375, -3.406982421875, -3.2823486328125, -3.15771484375, -3.0330810546875, -2.908447265625, -2.7838134765625, -2.6591796875, -2.5345458984375, -2.409912109375, -2.2852783203125, -2.16064453125, -2.0360107421875, -1.911376953125, -1.7867431640625, -1.662109375, -1.5374755859375, -1.412841796875, -1.2882080078125, -1.16357421875, -1.0389404296875, -0.914306640625, -0.7896728515625, -0.6650390625, -0.5404052734375, -0.415771484375, -0.2911376953125, -0.16650390625, -0.0418701171875, 0.082763671875, 0.2073974609375, 0.33203125, 0.4566650390625, 0.581298828125, 0.7059326171875, 0.83056640625, 0.9552001953125, 1.079833984375, 1.2044677734375, 1.3291015625, 1.4537353515625, 1.578369140625, 1.7030029296875, 1.82763671875, 1.9522705078125, 2.076904296875, 2.2015380859375, 2.326171875, 2.4508056640625, 2.575439453125, 2.7000732421875, 2.82470703125, 2.9493408203125, 3.073974609375, 3.1986083984375, 3.3232421875, 3.4478759765625, 3.572509765625, 3.6971435546875, 3.82177734375, 3.9464111328125, 4.071044921875, 4.1956787109375, 4.3203125]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 10.0, 6.0, 11.0, 13.0, 32.0, 21.0, 36.0, 50.0, 57.0, 80.0, 86.0, 83.0, 106.0, 89.0, 77.0, 59.0, 47.0, 29.0, 30.0, 14.0, 11.0, 14.0, 7.0, 9.0, 4.0, 4.0, 1.0, 3.0, 3.0, 6.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.48828125, -3.379364013671875, -3.27044677734375, -3.161529541015625, -3.0526123046875, -2.943695068359375, -2.83477783203125, -2.725860595703125, -2.616943359375, -2.508026123046875, -2.39910888671875, -2.290191650390625, -2.1812744140625, -2.072357177734375, -1.96343994140625, -1.854522705078125, -1.74560546875, -1.636688232421875, -1.52777099609375, -1.418853759765625, -1.3099365234375, -1.201019287109375, -1.09210205078125, -0.983184814453125, -0.874267578125, -0.765350341796875, -0.65643310546875, -0.547515869140625, -0.4385986328125, -0.329681396484375, -0.22076416015625, -0.111846923828125, -0.0029296875, 0.105987548828125, 0.21490478515625, 0.323822021484375, 0.4327392578125, 0.541656494140625, 0.65057373046875, 0.759490966796875, 0.868408203125, 0.977325439453125, 1.08624267578125, 1.195159912109375, 1.3040771484375, 1.412994384765625, 1.52191162109375, 1.630828857421875, 1.73974609375, 1.848663330078125, 1.95758056640625, 2.066497802734375, 2.1754150390625, 2.284332275390625, 2.39324951171875, 2.502166748046875, 2.611083984375, 2.720001220703125, 2.82891845703125, 2.937835693359375, 3.0467529296875, 3.155670166015625, 3.26458740234375, 3.373504638671875, 3.482421875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 7.0, 3.0, 6.0, 7.0, 10.0, 6.0, 14.0, 19.0, 18.0, 27.0, 34.0, 30.0, 33.0, 58.0, 70.0, 84.0, 122.0, 207.0, 428.0, 1359.0, 6898.0, 77062.0, 873513.0, 78979.0, 7037.0, 1367.0, 424.0, 187.0, 124.0, 87.0, 65.0, 61.0, 36.0, 33.0, 26.0, 23.0, 26.0, 21.0, 12.0, 8.0, 5.0, 6.0, 4.0, 4.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5234375, -2.42822265625, -2.3330078125, -2.23779296875, -2.142578125, -2.04736328125, -1.9521484375, -1.85693359375, -1.76171875, -1.66650390625, -1.5712890625, -1.47607421875, -1.380859375, -1.28564453125, -1.1904296875, -1.09521484375, -1.0, -0.90478515625, -0.8095703125, -0.71435546875, -0.619140625, -0.52392578125, -0.4287109375, -0.33349609375, -0.23828125, -0.14306640625, -0.0478515625, 0.04736328125, 0.142578125, 0.23779296875, 0.3330078125, 0.42822265625, 0.5234375, 0.61865234375, 0.7138671875, 0.80908203125, 0.904296875, 0.99951171875, 1.0947265625, 1.18994140625, 1.28515625, 1.38037109375, 1.4755859375, 1.57080078125, 1.666015625, 1.76123046875, 1.8564453125, 1.95166015625, 2.046875, 2.14208984375, 2.2373046875, 2.33251953125, 2.427734375, 2.52294921875, 2.6181640625, 2.71337890625, 2.80859375, 2.90380859375, 2.9990234375, 3.09423828125, 3.189453125, 3.28466796875, 3.3798828125, 3.47509765625, 3.5703125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 0.0, 4.0, 7.0, 8.0, 11.0, 14.0, 14.0, 17.0, 17.0, 25.0, 13.0, 26.0, 25.0, 37.0, 36.0, 33.0, 43.0, 37.0, 43.0, 45.0, 38.0, 48.0, 49.0, 41.0, 39.0, 39.0, 35.0, 34.0, 30.0, 35.0, 27.0, 23.0, 18.0, 16.0, 16.0, 12.0, 15.0, 8.0, 5.0, 3.0, 5.0, 3.0, 6.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.015625, -1.940887451171875, -1.86614990234375, -1.791412353515625, -1.7166748046875, -1.641937255859375, -1.56719970703125, -1.492462158203125, -1.417724609375, -1.342987060546875, -1.26824951171875, -1.193511962890625, -1.1187744140625, -1.044036865234375, -0.96929931640625, -0.894561767578125, -0.81982421875, -0.745086669921875, -0.67034912109375, -0.595611572265625, -0.5208740234375, -0.446136474609375, -0.37139892578125, -0.296661376953125, -0.221923828125, -0.147186279296875, -0.07244873046875, 0.002288818359375, 0.0770263671875, 0.151763916015625, 0.22650146484375, 0.301239013671875, 0.3759765625, 0.450714111328125, 0.52545166015625, 0.600189208984375, 0.6749267578125, 0.749664306640625, 0.82440185546875, 0.899139404296875, 0.973876953125, 1.048614501953125, 1.12335205078125, 1.198089599609375, 1.2728271484375, 1.347564697265625, 1.42230224609375, 1.497039794921875, 1.57177734375, 1.646514892578125, 1.72125244140625, 1.795989990234375, 1.8707275390625, 1.945465087890625, 2.02020263671875, 2.094940185546875, 2.169677734375, 2.244415283203125, 2.31915283203125, 2.393890380859375, 2.4686279296875, 2.543365478515625, 2.61810302734375, 2.692840576171875, 2.767578125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 7.0, 6.0, 12.0, 9.0, 10.0, 23.0, 22.0, 43.0, 71.0, 96.0, 154.0, 270.0, 553.0, 979.0, 2057.0, 4563.0, 11780.0, 38181.0, 184736.0, 613324.0, 141751.0, 31721.0, 10128.0, 4179.0, 1818.0, 911.0, 491.0, 245.0, 154.0, 85.0, 51.0, 41.0, 25.0, 17.0, 12.0, 11.0, 5.0, 6.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.52197265625, -0.5053634643554688, -0.4887542724609375, -0.47214508056640625, -0.455535888671875, -0.43892669677734375, -0.4223175048828125, -0.40570831298828125, -0.38909912109375, -0.37248992919921875, -0.3558807373046875, -0.33927154541015625, -0.322662353515625, -0.30605316162109375, -0.2894439697265625, -0.27283477783203125, -0.2562255859375, -0.23961639404296875, -0.2230072021484375, -0.20639801025390625, -0.189788818359375, -0.17317962646484375, -0.1565704345703125, -0.13996124267578125, -0.12335205078125, -0.10674285888671875, -0.0901336669921875, -0.07352447509765625, -0.056915283203125, -0.04030609130859375, -0.0236968994140625, -0.00708770751953125, 0.009521484375, 0.02613067626953125, 0.0427398681640625, 0.05934906005859375, 0.075958251953125, 0.09256744384765625, 0.1091766357421875, 0.12578582763671875, 0.14239501953125, 0.15900421142578125, 0.1756134033203125, 0.19222259521484375, 0.208831787109375, 0.22544097900390625, 0.2420501708984375, 0.25865936279296875, 0.2752685546875, 0.29187774658203125, 0.3084869384765625, 0.32509613037109375, 0.341705322265625, 0.35831451416015625, 0.3749237060546875, 0.39153289794921875, 0.40814208984375, 0.42475128173828125, 0.4413604736328125, 0.45796966552734375, 0.474578857421875, 0.49118804931640625, 0.5077972412109375, 0.5244064331054688, 0.541015625]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 13.0, 16.0, 24.0, 32.0, 79.0, 113.0, 164.0, 186.0, 130.0, 90.0, 62.0, 34.0, 16.0, 12.0, 5.0, 5.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00012767314910888672, -0.00012298673391342163, -0.00011830031871795654, -0.00011361390352249146, -0.00010892748832702637, -0.00010424107313156128, -9.955465793609619e-05, -9.48682427406311e-05, -9.018182754516602e-05, -8.549541234970093e-05, -8.080899715423584e-05, -7.612258195877075e-05, -7.143616676330566e-05, -6.674975156784058e-05, -6.206333637237549e-05, -5.73769211769104e-05, -5.269050598144531e-05, -4.8004090785980225e-05, -4.331767559051514e-05, -3.863126039505005e-05, -3.394484519958496e-05, -2.9258430004119873e-05, -2.4572014808654785e-05, -1.9885599613189697e-05, -1.519918441772461e-05, -1.0512769222259521e-05, -5.826354026794434e-06, -1.1399388313293457e-06, 3.546476364135742e-06, 8.23289155960083e-06, 1.2919306755065918e-05, 1.7605721950531006e-05, 2.2292137145996094e-05, 2.697855234146118e-05, 3.166496753692627e-05, 3.635138273239136e-05, 4.1037797927856445e-05, 4.572421312332153e-05, 5.041062831878662e-05, 5.509704351425171e-05, 5.97834587097168e-05, 6.446987390518188e-05, 6.915628910064697e-05, 7.384270429611206e-05, 7.852911949157715e-05, 8.321553468704224e-05, 8.790194988250732e-05, 9.258836507797241e-05, 9.72747802734375e-05, 0.00010196119546890259, 0.00010664761066436768, 0.00011133402585983276, 0.00011602044105529785, 0.00012070685625076294, 0.00012539327144622803, 0.00013007968664169312, 0.0001347661018371582, 0.0001394525170326233, 0.00014413893222808838, 0.00014882534742355347, 0.00015351176261901855, 0.00015819817781448364, 0.00016288459300994873, 0.00016757100820541382, 0.0001722574234008789]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 6.0, 9.0, 7.0, 5.0, 18.0, 28.0, 28.0, 46.0, 47.0, 100.0, 123.0, 189.0, 327.0, 472.0, 796.0, 1621.0, 3114.0, 6614.0, 16868.0, 53223.0, 251832.0, 542260.0, 119540.0, 30312.0, 10869.0, 4663.0, 2256.0, 1273.0, 648.0, 412.0, 282.0, 160.0, 122.0, 78.0, 62.0, 36.0, 32.0, 14.0, 16.0, 12.0, 9.0, 10.0, 7.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.465576171875, -0.4511528015136719, -0.43672943115234375, -0.4223060607910156, -0.4078826904296875, -0.3934593200683594, -0.37903594970703125, -0.3646125793457031, -0.350189208984375, -0.3357658386230469, -0.32134246826171875, -0.3069190979003906, -0.2924957275390625, -0.2780723571777344, -0.26364898681640625, -0.24922561645507812, -0.23480224609375, -0.22037887573242188, -0.20595550537109375, -0.19153213500976562, -0.1771087646484375, -0.16268539428710938, -0.14826202392578125, -0.13383865356445312, -0.119415283203125, -0.10499191284179688, -0.09056854248046875, -0.07614517211914062, -0.0617218017578125, -0.047298431396484375, -0.03287506103515625, -0.018451690673828125, -0.0040283203125, 0.010395050048828125, 0.02481842041015625, 0.039241790771484375, 0.0536651611328125, 0.06808853149414062, 0.08251190185546875, 0.09693527221679688, 0.111358642578125, 0.12578201293945312, 0.14020538330078125, 0.15462875366210938, 0.1690521240234375, 0.18347549438476562, 0.19789886474609375, 0.21232223510742188, 0.22674560546875, 0.24116897583007812, 0.25559234619140625, 0.2700157165527344, 0.2844390869140625, 0.2988624572753906, 0.31328582763671875, 0.3277091979980469, 0.342132568359375, 0.3565559387207031, 0.37097930908203125, 0.3854026794433594, 0.3998260498046875, 0.4142494201660156, 0.42867279052734375, 0.4430961608886719, 0.45751953125]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 5.0, 3.0, 10.0, 5.0, 7.0, 12.0, 9.0, 18.0, 21.0, 19.0, 20.0, 39.0, 51.0, 61.0, 71.0, 90.0, 105.0, 99.0, 64.0, 68.0, 52.0, 46.0, 20.0, 24.0, 19.0, 12.0, 9.0, 8.0, 6.0, 3.0, 5.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.241943359375, -0.23424911499023438, -0.22655487060546875, -0.21886062622070312, -0.2111663818359375, -0.20347213745117188, -0.19577789306640625, -0.18808364868164062, -0.180389404296875, -0.17269515991210938, -0.16500091552734375, -0.15730667114257812, -0.1496124267578125, -0.14191818237304688, -0.13422393798828125, -0.12652969360351562, -0.11883544921875, -0.11114120483398438, -0.10344696044921875, -0.09575271606445312, -0.0880584716796875, -0.08036422729492188, -0.07266998291015625, -0.06497573852539062, -0.057281494140625, -0.049587249755859375, -0.04189300537109375, -0.034198760986328125, -0.0265045166015625, -0.018810272216796875, -0.01111602783203125, -0.003421783447265625, 0.0042724609375, 0.011966705322265625, 0.01966094970703125, 0.027355194091796875, 0.0350494384765625, 0.042743682861328125, 0.05043792724609375, 0.058132171630859375, 0.065826416015625, 0.07352066040039062, 0.08121490478515625, 0.08890914916992188, 0.0966033935546875, 0.10429763793945312, 0.11199188232421875, 0.11968612670898438, 0.12738037109375, 0.13507461547851562, 0.14276885986328125, 0.15046310424804688, 0.1581573486328125, 0.16585159301757812, 0.17354583740234375, 0.18124008178710938, 0.188934326171875, 0.19662857055664062, 0.20432281494140625, 0.21201705932617188, 0.2197113037109375, 0.22740554809570312, 0.23509979248046875, 0.24279403686523438, 0.25048828125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 5.0, 9.0, 15.0, 29.0, 61.0, 153.0, 259.0, 250.0, 124.0, 43.0, 26.0, 12.0, 4.0, 4.0, 7.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.284575462341309, -8.025139808654785, -7.7657036781311035, -7.50626802444458, -7.246831893920898, -6.987396240234375, -6.727960586547852, -6.468524932861328, -6.2090888023376465, -5.949653148651123, -5.690217018127441, -5.430781364440918, -5.1713457107543945, -4.911909580230713, -4.6524739265441895, -4.393037796020508, -4.133602142333984, -3.874166250228882, -3.6147303581237793, -3.355294704437256, -3.0958588123321533, -2.836422920227051, -2.5769872665405273, -2.317551374435425, -2.0581154823303223, -1.7986795902252197, -1.5392438173294067, -1.2798080444335938, -1.0203721523284912, -0.7609362602233887, -0.5015004873275757, -0.2420647144317627, 0.01737213134765625, 0.276807963848114, 0.5362437963485718, 0.7956796288490295, 1.0551154613494873, 1.3145513534545898, 1.5739871263504028, 1.8334228992462158, 2.0928587913513184, 2.352294683456421, 2.6117305755615234, 2.871166229248047, 3.1306021213531494, 3.390038013458252, 3.6494736671447754, 3.908909559249878, 4.1683454513549805, 4.427781105041504, 4.6872172355651855, 4.946652889251709, 5.206089019775391, 5.465524673461914, 5.7249603271484375, 5.984395980834961, 6.243832111358643, 6.503267765045166, 6.762703895568848, 7.022139549255371, 7.2815752029418945, 7.541011333465576, 7.8004469871521, 8.059883117675781, 8.319318771362305]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 6.0, 6.0, 12.0, 16.0, 6.0, 14.0, 12.0, 17.0, 21.0, 23.0, 30.0, 35.0, 50.0, 35.0, 44.0, 38.0, 44.0, 40.0, 42.0, 43.0, 41.0, 51.0, 54.0, 43.0, 43.0, 25.0, 38.0, 32.0, 18.0, 25.0, 13.0, 14.0, 11.0, 7.0, 13.0, 7.0, 4.0, 6.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.649759769439697, -4.511108875274658, -4.372457504272461, -4.233806610107422, -4.095155715942383, -3.9565045833587646, -3.8178534507751465, -3.6792025566101074, -3.5405514240264893, -3.401900291442871, -3.263249397277832, -3.124598264694214, -2.9859471321105957, -2.8472962379455566, -2.7086451053619385, -2.5699939727783203, -2.4313430786132812, -2.292691946029663, -2.154041051864624, -2.015389919281006, -1.8767389059066772, -1.7380878925323486, -1.5994367599487305, -1.4607857465744019, -1.3221347332000732, -1.1834837198257446, -1.044832706451416, -0.9061815738677979, -0.7675305604934692, -0.6288795471191406, -0.49022847414016724, -0.35157740116119385, -0.21292686462402344, -0.07427582144737244, 0.06437522172927856, 0.20302626490592957, 0.34167730808258057, 0.4803283214569092, 0.6189793944358826, 0.757630467414856, 0.8962814807891846, 1.0349324941635132, 1.1735835075378418, 1.31223464012146, 1.4508856534957886, 1.5895366668701172, 1.7281877994537354, 1.866838812828064, 2.0054898262023926, 2.1441409587860107, 2.28279185295105, 2.421442985534668, 2.560093879699707, 2.698745012283325, 2.8373961448669434, 2.9760470390319824, 3.1146981716156006, 3.2533493041992188, 3.392000198364258, 3.530651330947876, 3.669302463531494, 3.807953357696533, 3.9466044902801514, 4.0852556228637695, 4.223906517028809]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 5.0, 10.0, 16.0, 24.0, 26.0, 42.0, 54.0, 96.0, 124.0, 225.0, 403.0, 768.0, 1512.0, 3654.0, 10165.0, 39215.0, 292856.0, 3552183.0, 241775.0, 34840.0, 9528.0, 3464.0, 1475.0, 707.0, 415.0, 255.0, 124.0, 101.0, 67.0, 38.0, 38.0, 26.0, 12.0, 11.0, 9.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.244140625, -2.172821044921875, -2.10150146484375, -2.030181884765625, -1.9588623046875, -1.887542724609375, -1.81622314453125, -1.744903564453125, -1.673583984375, -1.602264404296875, -1.53094482421875, -1.459625244140625, -1.3883056640625, -1.316986083984375, -1.24566650390625, -1.174346923828125, -1.10302734375, -1.031707763671875, -0.96038818359375, -0.889068603515625, -0.8177490234375, -0.746429443359375, -0.67510986328125, -0.603790283203125, -0.532470703125, -0.461151123046875, -0.38983154296875, -0.318511962890625, -0.2471923828125, -0.175872802734375, -0.10455322265625, -0.033233642578125, 0.0380859375, 0.109405517578125, 0.18072509765625, 0.252044677734375, 0.3233642578125, 0.394683837890625, 0.46600341796875, 0.537322998046875, 0.608642578125, 0.679962158203125, 0.75128173828125, 0.822601318359375, 0.8939208984375, 0.965240478515625, 1.03656005859375, 1.107879638671875, 1.17919921875, 1.250518798828125, 1.32183837890625, 1.393157958984375, 1.4644775390625, 1.535797119140625, 1.60711669921875, 1.678436279296875, 1.749755859375, 1.821075439453125, 1.89239501953125, 1.963714599609375, 2.0350341796875, 2.106353759765625, 2.17767333984375, 2.248992919921875, 2.3203125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 0.0, 2.0, 6.0, 5.0, 11.0, 10.0, 25.0, 15.0, 29.0, 26.0, 31.0, 52.0, 62.0, 76.0, 73.0, 73.0, 85.0, 77.0, 55.0, 64.0, 50.0, 46.0, 15.0, 25.0, 24.0, 12.0, 9.0, 10.0, 5.0, 8.0, 7.0, 4.0, 2.0, 0.0, 4.0, 3.0, 3.0, 1.0, 2.0, 2.0], "bins": [-2.25, -2.193817138671875, -2.13763427734375, -2.081451416015625, -2.0252685546875, -1.969085693359375, -1.91290283203125, -1.856719970703125, -1.800537109375, -1.744354248046875, -1.68817138671875, -1.631988525390625, -1.5758056640625, -1.519622802734375, -1.46343994140625, -1.407257080078125, -1.35107421875, -1.294891357421875, -1.23870849609375, -1.182525634765625, -1.1263427734375, -1.070159912109375, -1.01397705078125, -0.957794189453125, -0.901611328125, -0.845428466796875, -0.78924560546875, -0.733062744140625, -0.6768798828125, -0.620697021484375, -0.56451416015625, -0.508331298828125, -0.4521484375, -0.395965576171875, -0.33978271484375, -0.283599853515625, -0.2274169921875, -0.171234130859375, -0.11505126953125, -0.058868408203125, -0.002685546875, 0.053497314453125, 0.10968017578125, 0.165863037109375, 0.2220458984375, 0.278228759765625, 0.33441162109375, 0.390594482421875, 0.44677734375, 0.502960205078125, 0.55914306640625, 0.615325927734375, 0.6715087890625, 0.727691650390625, 0.78387451171875, 0.840057373046875, 0.896240234375, 0.952423095703125, 1.00860595703125, 1.064788818359375, 1.1209716796875, 1.177154541015625, 1.23333740234375, 1.289520263671875, 1.345703125]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 4.0, 1.0, 4.0, 2.0, 5.0, 7.0, 12.0, 15.0, 17.0, 27.0, 53.0, 45.0, 88.0, 192.0, 480.0, 1938.0, 16802.0, 3451822.0, 709135.0, 11286.0, 1555.0, 409.0, 148.0, 76.0, 43.0, 21.0, 26.0, 15.0, 20.0, 5.0, 8.0, 5.0, 2.0, 1.0, 6.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.359375, -5.19659423828125, -5.0338134765625, -4.87103271484375, -4.708251953125, -4.54547119140625, -4.3826904296875, -4.21990966796875, -4.05712890625, -3.89434814453125, -3.7315673828125, -3.56878662109375, -3.406005859375, -3.24322509765625, -3.0804443359375, -2.91766357421875, -2.7548828125, -2.59210205078125, -2.4293212890625, -2.26654052734375, -2.103759765625, -1.94097900390625, -1.7781982421875, -1.61541748046875, -1.45263671875, -1.28985595703125, -1.1270751953125, -0.96429443359375, -0.801513671875, -0.63873291015625, -0.4759521484375, -0.31317138671875, -0.150390625, 0.01239013671875, 0.1751708984375, 0.33795166015625, 0.500732421875, 0.66351318359375, 0.8262939453125, 0.98907470703125, 1.15185546875, 1.31463623046875, 1.4774169921875, 1.64019775390625, 1.802978515625, 1.96575927734375, 2.1285400390625, 2.29132080078125, 2.4541015625, 2.61688232421875, 2.7796630859375, 2.94244384765625, 3.105224609375, 3.26800537109375, 3.4307861328125, 3.59356689453125, 3.75634765625, 3.91912841796875, 4.0819091796875, 4.24468994140625, 4.407470703125, 4.57025146484375, 4.7330322265625, 4.89581298828125, 5.05859375]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 2.0, 5.0, 7.0, 8.0, 16.0, 16.0, 21.0, 31.0, 42.0, 57.0, 68.0, 94.0, 159.0, 260.0, 502.0, 1362.0, 552.0, 273.0, 167.0, 114.0, 86.0, 60.0, 37.0, 22.0, 18.0, 26.0, 13.0, 15.0, 6.0, 4.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.478271484375, -0.4621086120605469, -0.44594573974609375, -0.4297828674316406, -0.4136199951171875, -0.3974571228027344, -0.38129425048828125, -0.3651313781738281, -0.348968505859375, -0.3328056335449219, -0.31664276123046875, -0.3004798889160156, -0.2843170166015625, -0.2681541442871094, -0.25199127197265625, -0.23582839965820312, -0.21966552734375, -0.20350265502929688, -0.18733978271484375, -0.17117691040039062, -0.1550140380859375, -0.13885116577148438, -0.12268829345703125, -0.10652542114257812, -0.090362548828125, -0.07419967651367188, -0.05803680419921875, -0.041873931884765625, -0.0257110595703125, -0.009548187255859375, 0.00661468505859375, 0.022777557373046875, 0.0389404296875, 0.055103302001953125, 0.07126617431640625, 0.08742904663085938, 0.1035919189453125, 0.11975479125976562, 0.13591766357421875, 0.15208053588867188, 0.168243408203125, 0.18440628051757812, 0.20056915283203125, 0.21673202514648438, 0.2328948974609375, 0.24905776977539062, 0.26522064208984375, 0.2813835144042969, 0.29754638671875, 0.3137092590332031, 0.32987213134765625, 0.3460350036621094, 0.3621978759765625, 0.3783607482910156, 0.39452362060546875, 0.4106864929199219, 0.426849365234375, 0.4430122375488281, 0.45917510986328125, 0.4753379821777344, 0.4915008544921875, 0.5076637268066406, 0.5238265991210938, 0.5399894714355469, 0.55615234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 5.0, 9.0, 18.0, 19.0, 41.0, 70.0, 119.0, 174.0, 205.0, 151.0, 80.0, 39.0, 21.0, 11.0, 9.0, 8.0, 6.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.946353912353516, -4.822999000549316, -4.699644088745117, -4.57628870010376, -4.4529337882995605, -4.329578876495361, -4.206223964691162, -4.082868576049805, -3.9595136642456055, -3.8361587524414062, -3.712803602218628, -3.5894486904144287, -3.4660935401916504, -3.342738628387451, -3.219383716583252, -3.0960285663604736, -2.9726736545562744, -2.849318742752075, -2.725963592529297, -2.6026086807250977, -2.4792535305023193, -2.35589861869812, -2.232543468475342, -2.1091885566711426, -1.9858335256576538, -1.862478494644165, -1.7391234636306763, -1.6157684326171875, -1.4924135208129883, -1.36905837059021, -1.2457034587860107, -1.122348427772522, -0.9989931583404541, -0.8756381273269653, -0.7522830963134766, -0.6289281249046326, -0.5055730938911438, -0.38221806287765503, -0.25886309146881104, -0.13550806045532227, -0.012153029441833496, 0.11120198667049408, 0.23455700278282166, 0.35791200399398804, 0.4812670350074768, 0.6046220660209656, 0.7279770374298096, 0.8513320684432983, 0.9746870994567871, 1.0980421304702759, 1.2213971614837646, 1.3447520732879639, 1.4681072235107422, 1.5914621353149414, 1.7148171663284302, 1.838172197341919, 1.9615272283554077, 2.0848822593688965, 2.2082371711730957, 2.331592321395874, 2.4549472332000732, 2.5783023834228516, 2.701657295227051, 2.82501220703125, 2.9483673572540283]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 4.0, 8.0, 7.0, 11.0, 17.0, 19.0, 20.0, 35.0, 35.0, 49.0, 40.0, 74.0, 67.0, 71.0, 79.0, 73.0, 70.0, 66.0, 62.0, 47.0, 27.0, 29.0, 18.0, 15.0, 11.0, 6.0, 10.0, 9.0, 5.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1518020629882812, -2.0881271362304688, -2.0244522094726562, -1.9607775211334229, -1.8971025943756104, -1.8334276676177979, -1.769752860069275, -1.706078052520752, -1.6424031257629395, -1.578728199005127, -1.515053391456604, -1.451378583908081, -1.3877036571502686, -1.324028730392456, -1.260353922843933, -1.1966791152954102, -1.1330041885375977, -1.0693292617797852, -1.0056544542312622, -0.9419795870780945, -0.8783047199249268, -0.814629852771759, -0.7509549856185913, -0.6872801184654236, -0.6236052513122559, -0.5599303841590881, -0.4962555170059204, -0.4325806498527527, -0.36890578269958496, -0.30523091554641724, -0.2415560483932495, -0.1778811812400818, -0.11420643329620361, -0.05053156614303589, 0.013143301010131836, 0.07681816816329956, 0.14049303531646729, 0.204167902469635, 0.26784276962280273, 0.33151763677597046, 0.3951925039291382, 0.4588673710823059, 0.5225422382354736, 0.5862171053886414, 0.6498919725418091, 0.7135668396949768, 0.7772417068481445, 0.8409165740013123, 0.90459144115448, 0.9682663083076477, 1.0319411754608154, 1.095616102218628, 1.1592909097671509, 1.2229657173156738, 1.2866406440734863, 1.3503155708312988, 1.4139903783798218, 1.4776651859283447, 1.5413401126861572, 1.6050150394439697, 1.6686898469924927, 1.7323646545410156, 1.7960395812988281, 1.8597145080566406, 1.9233893156051636]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 6.0, 3.0, 9.0, 12.0, 14.0, 20.0, 33.0, 42.0, 61.0, 99.0, 140.0, 212.0, 330.0, 512.0, 812.0, 1303.0, 2229.0, 3946.0, 7594.0, 16364.0, 40097.0, 125456.0, 445328.0, 276998.0, 74611.0, 26928.0, 11835.0, 5772.0, 3111.0, 1762.0, 1039.0, 637.0, 399.0, 258.0, 189.0, 135.0, 85.0, 45.0, 34.0, 21.0, 25.0, 11.0, 18.0, 10.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.10626220703125, -0.10281085968017578, -0.09935951232910156, -0.09590816497802734, -0.09245681762695312, -0.0890054702758789, -0.08555412292480469, -0.08210277557373047, -0.07865142822265625, -0.07520008087158203, -0.07174873352050781, -0.0682973861694336, -0.06484603881835938, -0.061394691467285156, -0.05794334411621094, -0.05449199676513672, -0.0510406494140625, -0.04758930206298828, -0.04413795471191406, -0.040686607360839844, -0.037235260009765625, -0.033783912658691406, -0.030332565307617188, -0.02688121795654297, -0.02342987060546875, -0.01997852325439453, -0.016527175903320312, -0.013075828552246094, -0.009624481201171875, -0.006173133850097656, -0.0027217864990234375, 0.0007295608520507812, 0.004180908203125, 0.007632255554199219, 0.011083602905273438, 0.014534950256347656, 0.017986297607421875, 0.021437644958496094, 0.024888992309570312, 0.02834033966064453, 0.03179168701171875, 0.03524303436279297, 0.03869438171386719, 0.042145729064941406, 0.045597076416015625, 0.049048423767089844, 0.05249977111816406, 0.05595111846923828, 0.0594024658203125, 0.06285381317138672, 0.06630516052246094, 0.06975650787353516, 0.07320785522460938, 0.0766592025756836, 0.08011054992675781, 0.08356189727783203, 0.08701324462890625, 0.09046459197998047, 0.09391593933105469, 0.0973672866821289, 0.10081863403320312, 0.10426998138427734, 0.10772132873535156, 0.11117267608642578, 0.1146240234375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 7.0, 5.0, 8.0, 7.0, 12.0, 16.0, 23.0, 22.0, 46.0, 42.0, 62.0, 63.0, 86.0, 90.0, 81.0, 86.0, 72.0, 73.0, 42.0, 35.0, 26.0, 17.0, 13.0, 19.0, 6.0, 8.0, 7.0, 4.0, 6.0, 4.0, 6.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.576171875, -1.5284881591796875, -1.480804443359375, -1.4331207275390625, -1.38543701171875, -1.3377532958984375, -1.290069580078125, -1.2423858642578125, -1.1947021484375, -1.1470184326171875, -1.099334716796875, -1.0516510009765625, -1.00396728515625, -0.9562835693359375, -0.908599853515625, -0.8609161376953125, -0.813232421875, -0.7655487060546875, -0.717864990234375, -0.6701812744140625, -0.62249755859375, -0.5748138427734375, -0.527130126953125, -0.4794464111328125, -0.4317626953125, -0.3840789794921875, -0.336395263671875, -0.2887115478515625, -0.24102783203125, -0.1933441162109375, -0.145660400390625, -0.0979766845703125, -0.05029296875, -0.0026092529296875, 0.045074462890625, 0.0927581787109375, 0.14044189453125, 0.1881256103515625, 0.235809326171875, 0.2834930419921875, 0.3311767578125, 0.3788604736328125, 0.426544189453125, 0.4742279052734375, 0.52191162109375, 0.5695953369140625, 0.617279052734375, 0.6649627685546875, 0.712646484375, 0.7603302001953125, 0.808013916015625, 0.8556976318359375, 0.90338134765625, 0.9510650634765625, 0.998748779296875, 1.0464324951171875, 1.0941162109375, 1.1417999267578125, 1.189483642578125, 1.2371673583984375, 1.28485107421875, 1.3325347900390625, 1.380218505859375, 1.4279022216796875, 1.4755859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 3.0, 5.0, 9.0, 8.0, 12.0, 14.0, 20.0, 32.0, 31.0, 50.0, 62.0, 87.0, 126.0, 208.0, 291.0, 516.0, 1487.0, 7296.0, 55685.0, 651203.0, 299901.0, 25240.0, 3994.0, 1065.0, 389.0, 234.0, 130.0, 103.0, 72.0, 69.0, 52.0, 34.0, 24.0, 19.0, 12.0, 14.0, 11.0, 12.0, 8.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1751708984375, -0.16948890686035156, -0.16380691528320312, -0.1581249237060547, -0.15244293212890625, -0.1467609405517578, -0.14107894897460938, -0.13539695739746094, -0.1297149658203125, -0.12403297424316406, -0.11835098266601562, -0.11266899108886719, -0.10698699951171875, -0.10130500793457031, -0.09562301635742188, -0.08994102478027344, -0.084259033203125, -0.07857704162597656, -0.07289505004882812, -0.06721305847167969, -0.06153106689453125, -0.05584907531738281, -0.050167083740234375, -0.04448509216308594, -0.0388031005859375, -0.03312110900878906, -0.027439117431640625, -0.021757125854492188, -0.01607513427734375, -0.010393142700195312, -0.004711151123046875, 0.0009708404541015625, 0.00665283203125, 0.012334823608398438, 0.018016815185546875, 0.023698806762695312, 0.02938079833984375, 0.03506278991699219, 0.040744781494140625, 0.04642677307128906, 0.0521087646484375, 0.05779075622558594, 0.06347274780273438, 0.06915473937988281, 0.07483673095703125, 0.08051872253417969, 0.08620071411132812, 0.09188270568847656, 0.097564697265625, 0.10324668884277344, 0.10892868041992188, 0.11461067199707031, 0.12029266357421875, 0.1259746551513672, 0.13165664672851562, 0.13733863830566406, 0.1430206298828125, 0.14870262145996094, 0.15438461303710938, 0.1600666046142578, 0.16574859619140625, 0.1714305877685547, 0.17711257934570312, 0.18279457092285156, 0.1884765625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 5.0, 9.0, 9.0, 7.0, 15.0, 17.0, 13.0, 24.0, 31.0, 35.0, 44.0, 39.0, 55.0, 59.0, 47.0, 63.0, 55.0, 54.0, 55.0, 63.0, 56.0, 35.0, 26.0, 31.0, 31.0, 28.0, 19.0, 14.0, 15.0, 11.0, 8.0, 9.0, 2.0, 4.0, 5.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.162109375, -2.093719482421875, -2.02532958984375, -1.956939697265625, -1.8885498046875, -1.820159912109375, -1.75177001953125, -1.683380126953125, -1.614990234375, -1.546600341796875, -1.47821044921875, -1.409820556640625, -1.3414306640625, -1.273040771484375, -1.20465087890625, -1.136260986328125, -1.06787109375, -0.999481201171875, -0.93109130859375, -0.862701416015625, -0.7943115234375, -0.725921630859375, -0.65753173828125, -0.589141845703125, -0.520751953125, -0.452362060546875, -0.38397216796875, -0.315582275390625, -0.2471923828125, -0.178802490234375, -0.11041259765625, -0.042022705078125, 0.0263671875, 0.094757080078125, 0.16314697265625, 0.231536865234375, 0.2999267578125, 0.368316650390625, 0.43670654296875, 0.505096435546875, 0.573486328125, 0.641876220703125, 0.71026611328125, 0.778656005859375, 0.8470458984375, 0.915435791015625, 0.98382568359375, 1.052215576171875, 1.12060546875, 1.188995361328125, 1.25738525390625, 1.325775146484375, 1.3941650390625, 1.462554931640625, 1.53094482421875, 1.599334716796875, 1.667724609375, 1.736114501953125, 1.80450439453125, 1.872894287109375, 1.9412841796875, 2.009674072265625, 2.07806396484375, 2.146453857421875, 2.21484375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 7.0, 7.0, 8.0, 14.0, 18.0, 20.0, 32.0, 53.0, 74.0, 130.0, 208.0, 340.0, 669.0, 1717.0, 10856.0, 492040.0, 527740.0, 11292.0, 1729.0, 653.0, 357.0, 217.0, 134.0, 83.0, 56.0, 39.0, 17.0, 13.0, 7.0, 10.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.045074462890625, -0.04370880126953125, -0.0423431396484375, -0.04097747802734375, -0.03961181640625, -0.03824615478515625, -0.0368804931640625, -0.03551483154296875, -0.034149169921875, -0.03278350830078125, -0.0314178466796875, -0.03005218505859375, -0.0286865234375, -0.02732086181640625, -0.0259552001953125, -0.02458953857421875, -0.023223876953125, -0.02185821533203125, -0.0204925537109375, -0.01912689208984375, -0.01776123046875, -0.01639556884765625, -0.0150299072265625, -0.01366424560546875, -0.012298583984375, -0.01093292236328125, -0.0095672607421875, -0.00820159912109375, -0.0068359375, -0.00547027587890625, -0.0041046142578125, -0.00273895263671875, -0.001373291015625, -7.62939453125e-06, 0.0013580322265625, 0.00272369384765625, 0.00408935546875, 0.00545501708984375, 0.0068206787109375, 0.00818634033203125, 0.009552001953125, 0.01091766357421875, 0.0122833251953125, 0.01364898681640625, 0.0150146484375, 0.01638031005859375, 0.0177459716796875, 0.01911163330078125, 0.020477294921875, 0.02184295654296875, 0.0232086181640625, 0.02457427978515625, 0.02593994140625, 0.02730560302734375, 0.0286712646484375, 0.03003692626953125, 0.031402587890625, 0.03276824951171875, 0.0341339111328125, 0.03549957275390625, 0.036865234375, 0.03823089599609375, 0.0395965576171875, 0.04096221923828125, 0.042327880859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 5.0, 3.0, 14.0, 9.0, 8.0, 20.0, 31.0, 30.0, 45.0, 55.0, 72.0, 85.0, 98.0, 75.0, 81.0, 89.0, 60.0, 50.0, 45.0, 34.0, 22.0, 18.0, 14.0, 6.0, 10.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.436471939086914e-05, -1.3834796845912933e-05, -1.3304874300956726e-05, -1.2774951756000519e-05, -1.2245029211044312e-05, -1.1715106666088104e-05, -1.1185184121131897e-05, -1.065526157617569e-05, -1.0125339031219482e-05, -9.595416486263275e-06, -9.065493941307068e-06, -8.53557139635086e-06, -8.005648851394653e-06, -7.475726306438446e-06, -6.945803761482239e-06, -6.4158812165260315e-06, -5.885958671569824e-06, -5.356036126613617e-06, -4.82611358165741e-06, -4.296191036701202e-06, -3.766268491744995e-06, -3.236345946788788e-06, -2.7064234018325806e-06, -2.1765008568763733e-06, -1.646578311920166e-06, -1.1166557669639587e-06, -5.867332220077515e-07, -5.681067705154419e-08, 4.731118679046631e-07, 1.0030344128608704e-06, 1.5329569578170776e-06, 2.062879502773285e-06, 2.592802047729492e-06, 3.1227245926856995e-06, 3.6526471376419067e-06, 4.182569682598114e-06, 4.712492227554321e-06, 5.2424147725105286e-06, 5.772337317466736e-06, 6.302259862422943e-06, 6.83218240737915e-06, 7.362104952335358e-06, 7.892027497291565e-06, 8.421950042247772e-06, 8.95187258720398e-06, 9.481795132160187e-06, 1.0011717677116394e-05, 1.0541640222072601e-05, 1.1071562767028809e-05, 1.1601485311985016e-05, 1.2131407856941223e-05, 1.266133040189743e-05, 1.3191252946853638e-05, 1.3721175491809845e-05, 1.4251098036766052e-05, 1.478102058172226e-05, 1.5310943126678467e-05, 1.5840865671634674e-05, 1.637078821659088e-05, 1.690071076154709e-05, 1.7430633306503296e-05, 1.7960555851459503e-05, 1.849047839641571e-05, 1.9020400941371918e-05, 1.9550323486328125e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 11.0, 9.0, 20.0, 32.0, 65.0, 87.0, 126.0, 202.0, 371.0, 752.0, 1538.0, 3781.0, 11106.0, 45744.0, 576715.0, 356808.0, 35641.0, 9197.0, 3381.0, 1403.0, 639.0, 353.0, 228.0, 128.0, 67.0, 35.0, 35.0, 19.0, 17.0, 16.0, 3.0, 6.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037384033203125, -0.03624868392944336, -0.03511333465576172, -0.03397798538208008, -0.03284263610839844, -0.0317072868347168, -0.030571937561035156, -0.029436588287353516, -0.028301239013671875, -0.027165889739990234, -0.026030540466308594, -0.024895191192626953, -0.023759841918945312, -0.022624492645263672, -0.02148914337158203, -0.02035379409790039, -0.01921844482421875, -0.01808309555053711, -0.01694774627685547, -0.015812397003173828, -0.014677047729492188, -0.013541698455810547, -0.012406349182128906, -0.011270999908447266, -0.010135650634765625, -0.009000301361083984, -0.007864952087402344, -0.006729602813720703, -0.0055942535400390625, -0.004458904266357422, -0.0033235549926757812, -0.0021882057189941406, -0.0010528564453125, 8.249282836914062e-05, 0.0012178421020507812, 0.002353191375732422, 0.0034885406494140625, 0.004623889923095703, 0.005759239196777344, 0.006894588470458984, 0.008029937744140625, 0.009165287017822266, 0.010300636291503906, 0.011435985565185547, 0.012571334838867188, 0.013706684112548828, 0.014842033386230469, 0.01597738265991211, 0.01711273193359375, 0.01824808120727539, 0.01938343048095703, 0.020518779754638672, 0.021654129028320312, 0.022789478302001953, 0.023924827575683594, 0.025060176849365234, 0.026195526123046875, 0.027330875396728516, 0.028466224670410156, 0.029601573944091797, 0.030736923217773438, 0.03187227249145508, 0.03300762176513672, 0.03414297103881836, 0.0352783203125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 8.0, 15.0, 23.0, 40.0, 70.0, 121.0, 264.0, 212.0, 71.0, 63.0, 29.0, 32.0, 13.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00811004638671875, -0.007876873016357422, -0.007643699645996094, -0.007410526275634766, -0.0071773529052734375, -0.006944179534912109, -0.006711006164550781, -0.006477832794189453, -0.006244659423828125, -0.006011486053466797, -0.005778312683105469, -0.005545139312744141, -0.0053119659423828125, -0.005078792572021484, -0.004845619201660156, -0.004612445831298828, -0.0043792724609375, -0.004146099090576172, -0.003912925720214844, -0.0036797523498535156, -0.0034465789794921875, -0.0032134056091308594, -0.0029802322387695312, -0.002747058868408203, -0.002513885498046875, -0.002280712127685547, -0.0020475387573242188, -0.0018143653869628906, -0.0015811920166015625, -0.0013480186462402344, -0.0011148452758789062, -0.0008816719055175781, -0.00064849853515625, -0.0004153251647949219, -0.00018215179443359375, 5.1021575927734375e-05, 0.0002841949462890625, 0.0005173683166503906, 0.0007505416870117188, 0.0009837150573730469, 0.001216888427734375, 0.0014500617980957031, 0.0016832351684570312, 0.0019164085388183594, 0.0021495819091796875, 0.0023827552795410156, 0.0026159286499023438, 0.002849102020263672, 0.003082275390625, 0.003315448760986328, 0.0035486221313476562, 0.0037817955017089844, 0.0040149688720703125, 0.004248142242431641, 0.004481315612792969, 0.004714488983154297, 0.004947662353515625, 0.005180835723876953, 0.005414009094238281, 0.005647182464599609, 0.0058803558349609375, 0.006113529205322266, 0.006346702575683594, 0.006579875946044922, 0.00681304931640625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 15.0, 16.0, 23.0, 66.0, 107.0, 174.0, 251.0, 167.0, 81.0, 33.0, 19.0, 14.0, 7.0, 8.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.545215129852295, -3.450169324874878, -3.355123281478882, -3.260077476501465, -3.1650314331054688, -3.0699856281280518, -2.9749398231506348, -2.8798937797546387, -2.7848479747772217, -2.6898021697998047, -2.5947561264038086, -2.4997103214263916, -2.4046645164489746, -2.3096184730529785, -2.2145726680755615, -2.1195268630981445, -2.0244808197021484, -1.929434895515442, -1.8343889713287354, -1.7393431663513184, -1.6442972421646118, -1.5492513179779053, -1.4542055130004883, -1.3591595888137817, -1.2641136646270752, -1.1690677404403687, -1.074021816253662, -0.9789760112762451, -0.8839300870895386, -0.788884162902832, -0.6938382983207703, -0.5987924337387085, -0.503746509552002, -0.4087006151676178, -0.31365472078323364, -0.2186088263988495, -0.12356293201446533, -0.028517037630081177, 0.06652885675430298, 0.16157472133636475, 0.2566206455230713, 0.35166653990745544, 0.4467124342918396, 0.5417582988739014, 0.6368042230606079, 0.7318501472473145, 0.8268960118293762, 0.921941876411438, 1.0169878005981445, 1.112033724784851, 1.2070796489715576, 1.3021254539489746, 1.3971713781356812, 1.4922173023223877, 1.5872631072998047, 1.6823090314865112, 1.7773549556732178, 1.8724008798599243, 1.9674468040466309, 2.062492609024048, 2.157538414001465, 2.252584457397461, 2.347630262374878, 2.442676067352295, 2.537722110748291]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 8.0, 6.0, 8.0, 9.0, 14.0, 17.0, 25.0, 30.0, 43.0, 54.0, 60.0, 77.0, 88.0, 88.0, 91.0, 74.0, 74.0, 62.0, 43.0, 23.0, 26.0, 13.0, 19.0, 6.0, 8.0, 11.0, 6.0, 7.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6878008842468262, -1.6405261754989624, -1.593251347541809, -1.5459766387939453, -1.498701810836792, -1.4514271020889282, -1.4041523933410645, -1.3568775653839111, -1.3096028566360474, -1.2623281478881836, -1.2150533199310303, -1.1677786111831665, -1.1205039024353027, -1.0732290744781494, -1.0259543657302856, -0.9786795973777771, -0.9314048290252686, -0.88413006067276, -0.8368552923202515, -0.7895805835723877, -0.7423058152198792, -0.6950310468673706, -0.6477563381195068, -0.6004815697669983, -0.5532068014144897, -0.5059320330619812, -0.45865729451179504, -0.4113825559616089, -0.36410778760910034, -0.3168330192565918, -0.26955828070640564, -0.22228354215621948, -0.1750088930130005, -0.12773413956165314, -0.08045938611030579, -0.033184632658958435, 0.014090120792388916, 0.06136487424373627, 0.10863962769508362, 0.15591436624526978, 0.20318913459777832, 0.25046390295028687, 0.297738641500473, 0.3450133800506592, 0.3922881484031677, 0.43956291675567627, 0.4868376553058624, 0.5341123938560486, 0.5813871622085571, 0.6286619305610657, 0.6759366989135742, 0.723211407661438, 0.7704861760139465, 0.8177609443664551, 0.8650356531143188, 0.9123104214668274, 0.9595851898193359, 1.0068598985671997, 1.054134726524353, 1.1014094352722168, 1.1486842632293701, 1.1959589719772339, 1.2432336807250977, 1.290508508682251, 1.3377832174301147]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 6.0, 8.0, 1.0, 5.0, 8.0, 8.0, 10.0, 24.0, 40.0, 70.0, 112.0, 247.0, 427.0, 1053.0, 2708.0, 9236.0, 47682.0, 544414.0, 392522.0, 37958.0, 7805.0, 2415.0, 911.0, 416.0, 185.0, 89.0, 58.0, 37.0, 34.0, 22.0, 9.0, 4.0, 9.0, 3.0, 3.0, 1.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.36328125, -2.291534423828125, -2.21978759765625, -2.148040771484375, -2.0762939453125, -2.004547119140625, -1.93280029296875, -1.861053466796875, -1.789306640625, -1.717559814453125, -1.64581298828125, -1.574066162109375, -1.5023193359375, -1.430572509765625, -1.35882568359375, -1.287078857421875, -1.21533203125, -1.143585205078125, -1.07183837890625, -1.000091552734375, -0.9283447265625, -0.856597900390625, -0.78485107421875, -0.713104248046875, -0.641357421875, -0.569610595703125, -0.49786376953125, -0.426116943359375, -0.3543701171875, -0.282623291015625, -0.21087646484375, -0.139129638671875, -0.0673828125, 0.004364013671875, 0.07611083984375, 0.147857666015625, 0.2196044921875, 0.291351318359375, 0.36309814453125, 0.434844970703125, 0.506591796875, 0.578338623046875, 0.65008544921875, 0.721832275390625, 0.7935791015625, 0.865325927734375, 0.93707275390625, 1.008819580078125, 1.08056640625, 1.152313232421875, 1.22406005859375, 1.295806884765625, 1.3675537109375, 1.439300537109375, 1.51104736328125, 1.582794189453125, 1.654541015625, 1.726287841796875, 1.79803466796875, 1.869781494140625, 1.9415283203125, 2.013275146484375, 2.08502197265625, 2.156768798828125, 2.228515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 6.0, 9.0, 10.0, 7.0, 16.0, 26.0, 29.0, 49.0, 61.0, 67.0, 84.0, 103.0, 108.0, 103.0, 80.0, 67.0, 50.0, 36.0, 20.0, 15.0, 17.0, 5.0, 12.0, 10.0, 2.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.333831787109375, -4.21063232421875, -4.087432861328125, -3.9642333984375, -3.841033935546875, -3.71783447265625, -3.594635009765625, -3.471435546875, -3.348236083984375, -3.22503662109375, -3.101837158203125, -2.9786376953125, -2.855438232421875, -2.73223876953125, -2.609039306640625, -2.48583984375, -2.362640380859375, -2.23944091796875, -2.116241455078125, -1.9930419921875, -1.869842529296875, -1.74664306640625, -1.623443603515625, -1.500244140625, -1.377044677734375, -1.25384521484375, -1.130645751953125, -1.0074462890625, -0.884246826171875, -0.76104736328125, -0.637847900390625, -0.5146484375, -0.391448974609375, -0.26824951171875, -0.145050048828125, -0.0218505859375, 0.101348876953125, 0.22454833984375, 0.347747802734375, 0.470947265625, 0.594146728515625, 0.71734619140625, 0.840545654296875, 0.9637451171875, 1.086944580078125, 1.21014404296875, 1.333343505859375, 1.45654296875, 1.579742431640625, 1.70294189453125, 1.826141357421875, 1.9493408203125, 2.072540283203125, 2.19573974609375, 2.318939208984375, 2.442138671875, 2.565338134765625, 2.68853759765625, 2.811737060546875, 2.9349365234375, 3.058135986328125, 3.18133544921875, 3.304534912109375, 3.427734375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 8.0, 14.0, 9.0, 16.0, 21.0, 37.0, 39.0, 69.0, 88.0, 139.0, 234.0, 464.0, 1009.0, 2396.0, 6806.0, 28996.0, 251687.0, 671477.0, 66143.0, 12187.0, 3668.0, 1457.0, 643.0, 343.0, 211.0, 132.0, 92.0, 57.0, 32.0, 21.0, 17.0, 15.0, 5.0, 4.0, 6.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.716796875, -1.6666259765625, -1.616455078125, -1.5662841796875, -1.51611328125, -1.4659423828125, -1.415771484375, -1.3656005859375, -1.3154296875, -1.2652587890625, -1.215087890625, -1.1649169921875, -1.11474609375, -1.0645751953125, -1.014404296875, -0.9642333984375, -0.9140625, -0.8638916015625, -0.813720703125, -0.7635498046875, -0.71337890625, -0.6632080078125, -0.613037109375, -0.5628662109375, -0.5126953125, -0.4625244140625, -0.412353515625, -0.3621826171875, -0.31201171875, -0.2618408203125, -0.211669921875, -0.1614990234375, -0.111328125, -0.0611572265625, -0.010986328125, 0.0391845703125, 0.08935546875, 0.1395263671875, 0.189697265625, 0.2398681640625, 0.2900390625, 0.3402099609375, 0.390380859375, 0.4405517578125, 0.49072265625, 0.5408935546875, 0.591064453125, 0.6412353515625, 0.69140625, 0.7415771484375, 0.791748046875, 0.8419189453125, 0.89208984375, 0.9422607421875, 0.992431640625, 1.0426025390625, 1.0927734375, 1.1429443359375, 1.193115234375, 1.2432861328125, 1.29345703125, 1.3436279296875, 1.393798828125, 1.4439697265625, 1.494140625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 8.0, 7.0, 12.0, 13.0, 7.0, 18.0, 14.0, 24.0, 35.0, 29.0, 31.0, 35.0, 34.0, 29.0, 42.0, 34.0, 44.0, 45.0, 43.0, 40.0, 42.0, 46.0, 32.0, 43.0, 30.0, 34.0, 33.0, 34.0, 18.0, 24.0, 14.0, 16.0, 15.0, 16.0, 14.0, 12.0, 9.0, 4.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.57421875, -2.496307373046875, -2.41839599609375, -2.340484619140625, -2.2625732421875, -2.184661865234375, -2.10675048828125, -2.028839111328125, -1.950927734375, -1.873016357421875, -1.79510498046875, -1.717193603515625, -1.6392822265625, -1.561370849609375, -1.48345947265625, -1.405548095703125, -1.32763671875, -1.249725341796875, -1.17181396484375, -1.093902587890625, -1.0159912109375, -0.938079833984375, -0.86016845703125, -0.782257080078125, -0.704345703125, -0.626434326171875, -0.54852294921875, -0.470611572265625, -0.3927001953125, -0.314788818359375, -0.23687744140625, -0.158966064453125, -0.0810546875, -0.003143310546875, 0.07476806640625, 0.152679443359375, 0.2305908203125, 0.308502197265625, 0.38641357421875, 0.464324951171875, 0.542236328125, 0.620147705078125, 0.69805908203125, 0.775970458984375, 0.8538818359375, 0.931793212890625, 1.00970458984375, 1.087615966796875, 1.16552734375, 1.243438720703125, 1.32135009765625, 1.399261474609375, 1.4771728515625, 1.555084228515625, 1.63299560546875, 1.710906982421875, 1.788818359375, 1.866729736328125, 1.94464111328125, 2.022552490234375, 2.1004638671875, 2.178375244140625, 2.25628662109375, 2.334197998046875, 2.412109375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 9.0, 8.0, 9.0, 17.0, 15.0, 25.0, 38.0, 60.0, 63.0, 122.0, 220.0, 324.0, 590.0, 1020.0, 2150.0, 4881.0, 14190.0, 56598.0, 506699.0, 392307.0, 47994.0, 12444.0, 4387.0, 2006.0, 969.0, 525.0, 328.0, 183.0, 118.0, 82.0, 43.0, 36.0, 24.0, 19.0, 12.0, 6.0, 8.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51904296875, -0.5022735595703125, -0.485504150390625, -0.4687347412109375, -0.45196533203125, -0.4351959228515625, -0.418426513671875, -0.4016571044921875, -0.3848876953125, -0.3681182861328125, -0.351348876953125, -0.3345794677734375, -0.31781005859375, -0.3010406494140625, -0.284271240234375, -0.2675018310546875, -0.250732421875, -0.2339630126953125, -0.217193603515625, -0.2004241943359375, -0.18365478515625, -0.1668853759765625, -0.150115966796875, -0.1333465576171875, -0.1165771484375, -0.0998077392578125, -0.083038330078125, -0.0662689208984375, -0.04949951171875, -0.0327301025390625, -0.015960693359375, 0.0008087158203125, 0.017578125, 0.0343475341796875, 0.051116943359375, 0.0678863525390625, 0.08465576171875, 0.1014251708984375, 0.118194580078125, 0.1349639892578125, 0.1517333984375, 0.1685028076171875, 0.185272216796875, 0.2020416259765625, 0.21881103515625, 0.2355804443359375, 0.252349853515625, 0.2691192626953125, 0.285888671875, 0.3026580810546875, 0.319427490234375, 0.3361968994140625, 0.35296630859375, 0.3697357177734375, 0.386505126953125, 0.4032745361328125, 0.4200439453125, 0.4368133544921875, 0.453582763671875, 0.4703521728515625, 0.48712158203125, 0.5038909912109375, 0.520660400390625, 0.5374298095703125, 0.55419921875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 5.0, 8.0, 8.0, 12.0, 19.0, 27.0, 30.0, 44.0, 78.0, 115.0, 177.0, 176.0, 102.0, 57.0, 45.0, 38.0, 17.0, 15.0, 10.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013184547424316406, -0.00012817233800888062, -0.00012449920177459717, -0.00012082606554031372, -0.00011715292930603027, -0.00011347979307174683, -0.00010980665683746338, -0.00010613352060317993, -0.00010246038436889648, -9.878724813461304e-05, -9.511411190032959e-05, -9.144097566604614e-05, -8.77678394317627e-05, -8.409470319747925e-05, -8.04215669631958e-05, -7.674843072891235e-05, -7.30752944946289e-05, -6.940215826034546e-05, -6.572902202606201e-05, -6.205588579177856e-05, -5.838274955749512e-05, -5.470961332321167e-05, -5.103647708892822e-05, -4.7363340854644775e-05, -4.369020462036133e-05, -4.001706838607788e-05, -3.6343932151794434e-05, -3.2670795917510986e-05, -2.899765968322754e-05, -2.5324523448944092e-05, -2.1651387214660645e-05, -1.7978250980377197e-05, -1.430511474609375e-05, -1.0631978511810303e-05, -6.9588422775268555e-06, -3.285706043243408e-06, 3.8743019104003906e-07, 4.060566425323486e-06, 7.733702659606934e-06, 1.1406838893890381e-05, 1.5079975128173828e-05, 1.8753111362457275e-05, 2.2426247596740723e-05, 2.609938383102417e-05, 2.9772520065307617e-05, 3.3445656299591064e-05, 3.711879253387451e-05, 4.079192876815796e-05, 4.4465065002441406e-05, 4.8138201236724854e-05, 5.18113374710083e-05, 5.548447370529175e-05, 5.9157609939575195e-05, 6.283074617385864e-05, 6.650388240814209e-05, 7.017701864242554e-05, 7.385015487670898e-05, 7.752329111099243e-05, 8.119642734527588e-05, 8.486956357955933e-05, 8.854269981384277e-05, 9.221583604812622e-05, 9.588897228240967e-05, 9.956210851669312e-05, 0.00010323524475097656]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 11.0, 8.0, 17.0, 28.0, 35.0, 50.0, 62.0, 93.0, 157.0, 291.0, 557.0, 1118.0, 2561.0, 6594.0, 23215.0, 142424.0, 733657.0, 107320.0, 19797.0, 5922.0, 2336.0, 992.0, 537.0, 298.0, 152.0, 108.0, 61.0, 24.0, 36.0, 26.0, 17.0, 14.0, 8.0, 8.0, 3.0, 2.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5654296875, -0.5468521118164062, -0.5282745361328125, -0.5096969604492188, -0.491119384765625, -0.47254180908203125, -0.4539642333984375, -0.43538665771484375, -0.41680908203125, -0.39823150634765625, -0.3796539306640625, -0.36107635498046875, -0.342498779296875, -0.32392120361328125, -0.3053436279296875, -0.28676605224609375, -0.2681884765625, -0.24961090087890625, -0.2310333251953125, -0.21245574951171875, -0.193878173828125, -0.17530059814453125, -0.1567230224609375, -0.13814544677734375, -0.11956787109375, -0.10099029541015625, -0.0824127197265625, -0.06383514404296875, -0.045257568359375, -0.02667999267578125, -0.0081024169921875, 0.01047515869140625, 0.029052734375, 0.04763031005859375, 0.0662078857421875, 0.08478546142578125, 0.103363037109375, 0.12194061279296875, 0.1405181884765625, 0.15909576416015625, 0.17767333984375, 0.19625091552734375, 0.2148284912109375, 0.23340606689453125, 0.251983642578125, 0.27056121826171875, 0.2891387939453125, 0.30771636962890625, 0.3262939453125, 0.34487152099609375, 0.3634490966796875, 0.38202667236328125, 0.400604248046875, 0.41918182373046875, 0.4377593994140625, 0.45633697509765625, 0.47491455078125, 0.49349212646484375, 0.5120697021484375, 0.5306472778320312, 0.549224853515625, 0.5678024291992188, 0.5863800048828125, 0.6049575805664062, 0.62353515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 7.0, 3.0, 5.0, 5.0, 2.0, 7.0, 12.0, 11.0, 11.0, 18.0, 28.0, 33.0, 37.0, 63.0, 111.0, 137.0, 141.0, 95.0, 71.0, 44.0, 38.0, 20.0, 18.0, 15.0, 14.0, 13.0, 6.0, 11.0, 6.0, 5.0, 4.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.301513671875, -0.2929363250732422, -0.2843589782714844, -0.27578163146972656, -0.26720428466796875, -0.25862693786621094, -0.2500495910644531, -0.2414722442626953, -0.2328948974609375, -0.2243175506591797, -0.21574020385742188, -0.20716285705566406, -0.19858551025390625, -0.19000816345214844, -0.18143081665039062, -0.1728534698486328, -0.164276123046875, -0.1556987762451172, -0.14712142944335938, -0.13854408264160156, -0.12996673583984375, -0.12138938903808594, -0.11281204223632812, -0.10423469543457031, -0.0956573486328125, -0.08708000183105469, -0.07850265502929688, -0.06992530822753906, -0.06134796142578125, -0.05277061462402344, -0.044193267822265625, -0.03561592102050781, -0.02703857421875, -0.018461227416992188, -0.009883880615234375, -0.0013065338134765625, 0.00727081298828125, 0.015848159790039062, 0.024425506591796875, 0.03300285339355469, 0.0415802001953125, 0.05015754699707031, 0.058734893798828125, 0.06731224060058594, 0.07588958740234375, 0.08446693420410156, 0.09304428100585938, 0.10162162780761719, 0.110198974609375, 0.11877632141113281, 0.12735366821289062, 0.13593101501464844, 0.14450836181640625, 0.15308570861816406, 0.16166305541992188, 0.1702404022216797, 0.1788177490234375, 0.1873950958251953, 0.19597244262695312, 0.20454978942871094, 0.21312713623046875, 0.22170448303222656, 0.23028182983398438, 0.2388591766357422, 0.2474365234375]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 3.0, 22.0, 47.0, 135.0, 295.0, 312.0, 110.0, 43.0, 12.0, 9.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.425975322723389, -6.11962890625, -5.813282012939453, -5.506935119628906, -5.200588703155518, -4.894242286682129, -4.587895393371582, -4.281548500061035, -3.9752020835876465, -3.6688554286956787, -3.362508773803711, -3.056162118911743, -2.7498154640197754, -2.4434688091278076, -2.13712215423584, -1.830775499343872, -1.5244288444519043, -1.2180821895599365, -0.9117355346679688, -0.605388879776001, -0.2990422248840332, 0.00730443000793457, 0.31365108489990234, 0.6199977397918701, 0.9263443946838379, 1.2326910495758057, 1.5390377044677734, 1.8453843593597412, 2.151731014251709, 2.4580776691436768, 2.7644243240356445, 3.0707709789276123, 3.377117156982422, 3.6834638118743896, 3.9898104667663574, 4.296156883239746, 4.602503776550293, 4.90885066986084, 5.2151970863342285, 5.521543502807617, 5.827890396118164, 6.134237289428711, 6.4405837059021, 6.746930122375488, 7.053277015686035, 7.359623908996582, 7.665970325469971, 7.972316741943359, 8.278663635253906, 8.585010528564453, 8.891357421875, 9.19770336151123, 9.504050254821777, 9.810397148132324, 10.116743087768555, 10.423089981079102, 10.729436874389648, 11.035783767700195, 11.342130661010742, 11.648476600646973, 11.95482349395752, 12.261170387268066, 12.567516326904297, 12.873863220214844, 13.18021011352539]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 1.0, 3.0, 6.0, 4.0, 10.0, 17.0, 14.0, 17.0, 21.0, 33.0, 38.0, 32.0, 32.0, 45.0, 34.0, 39.0, 55.0, 46.0, 46.0, 64.0, 46.0, 41.0, 31.0, 48.0, 40.0, 36.0, 40.0, 32.0, 21.0, 23.0, 12.0, 10.0, 11.0, 8.0, 12.0, 5.0, 6.0, 8.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.931207656860352, -4.767642498016357, -4.604077339172363, -4.440511703491211, -4.276946544647217, -4.113381385803223, -3.9498162269592285, -3.7862510681152344, -3.622685670852661, -3.459120512008667, -3.2955551147460938, -3.1319899559020996, -2.9684247970581055, -2.8048593997955322, -2.641294240951538, -2.477728843688965, -2.3141636848449707, -2.1505985260009766, -1.9870331287384033, -1.8234679698944092, -1.6599026918411255, -1.4963374137878418, -1.3327722549438477, -1.169206976890564, -1.0056416988372803, -0.8420764207839966, -0.6785112023353577, -0.5149459838867188, -0.35138070583343506, -0.18781542778015137, -0.02425020933151245, 0.13931500911712646, 0.30288076400756836, 0.46644601225852966, 0.630011260509491, 0.7935764789581299, 0.9571417570114136, 1.1207070350646973, 1.2842721939086914, 1.447837471961975, 1.6114027500152588, 1.7749680280685425, 1.9385333061218262, 2.1020984649658203, 2.2656636238098145, 2.4292290210723877, 2.592794179916382, 2.756359577178955, 2.919924736022949, 3.0834898948669434, 3.2470552921295166, 3.4106204509735107, 3.574185848236084, 3.737751007080078, 3.9013161659240723, 4.064881324768066, 4.228446960449219, 4.392012119293213, 4.555577278137207, 4.719142913818359, 4.8827080726623535, 5.046273231506348, 5.209838390350342, 5.373403549194336, 5.53696870803833]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 8.0, 21.0, 12.0, 24.0, 41.0, 54.0, 95.0, 130.0, 222.0, 329.0, 530.0, 1034.0, 2102.0, 4562.0, 12014.0, 40901.0, 241521.0, 3350249.0, 455626.0, 57713.0, 15877.0, 5669.0, 2432.0, 1314.0, 691.0, 409.0, 248.0, 142.0, 106.0, 71.0, 40.0, 29.0, 21.0, 14.0, 12.0, 5.0, 7.0, 4.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.10546875, -2.0446624755859375, -1.983856201171875, -1.9230499267578125, -1.86224365234375, -1.8014373779296875, -1.740631103515625, -1.6798248291015625, -1.6190185546875, -1.5582122802734375, -1.497406005859375, -1.4365997314453125, -1.37579345703125, -1.3149871826171875, -1.254180908203125, -1.1933746337890625, -1.132568359375, -1.0717620849609375, -1.010955810546875, -0.9501495361328125, -0.88934326171875, -0.8285369873046875, -0.767730712890625, -0.7069244384765625, -0.6461181640625, -0.5853118896484375, -0.524505615234375, -0.4636993408203125, -0.40289306640625, -0.3420867919921875, -0.281280517578125, -0.2204742431640625, -0.15966796875, -0.0988616943359375, -0.038055419921875, 0.0227508544921875, 0.08355712890625, 0.1443634033203125, 0.205169677734375, 0.2659759521484375, 0.3267822265625, 0.3875885009765625, 0.448394775390625, 0.5092010498046875, 0.57000732421875, 0.6308135986328125, 0.691619873046875, 0.7524261474609375, 0.813232421875, 0.8740386962890625, 0.934844970703125, 0.9956512451171875, 1.05645751953125, 1.1172637939453125, 1.178070068359375, 1.2388763427734375, 1.2996826171875, 1.3604888916015625, 1.421295166015625, 1.4821014404296875, 1.54290771484375, 1.6037139892578125, 1.664520263671875, 1.7253265380859375, 1.7861328125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 6.0, 2.0, 10.0, 7.0, 6.0, 17.0, 26.0, 27.0, 40.0, 51.0, 33.0, 73.0, 74.0, 106.0, 97.0, 103.0, 70.0, 51.0, 44.0, 33.0, 28.0, 23.0, 13.0, 11.0, 12.0, 6.0, 6.0, 9.0, 4.0, 1.0, 3.0, 3.0, 1.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.94140625, -1.88287353515625, -1.8243408203125, -1.76580810546875, -1.707275390625, -1.64874267578125, -1.5902099609375, -1.53167724609375, -1.47314453125, -1.41461181640625, -1.3560791015625, -1.29754638671875, -1.239013671875, -1.18048095703125, -1.1219482421875, -1.06341552734375, -1.0048828125, -0.94635009765625, -0.8878173828125, -0.82928466796875, -0.770751953125, -0.71221923828125, -0.6536865234375, -0.59515380859375, -0.53662109375, -0.47808837890625, -0.4195556640625, -0.36102294921875, -0.302490234375, -0.24395751953125, -0.1854248046875, -0.12689208984375, -0.068359375, -0.00982666015625, 0.0487060546875, 0.10723876953125, 0.165771484375, 0.22430419921875, 0.2828369140625, 0.34136962890625, 0.39990234375, 0.45843505859375, 0.5169677734375, 0.57550048828125, 0.634033203125, 0.69256591796875, 0.7510986328125, 0.80963134765625, 0.8681640625, 0.92669677734375, 0.9852294921875, 1.04376220703125, 1.102294921875, 1.16082763671875, 1.2193603515625, 1.27789306640625, 1.33642578125, 1.39495849609375, 1.4534912109375, 1.51202392578125, 1.570556640625, 1.62908935546875, 1.6876220703125, 1.74615478515625, 1.8046875]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 9.0, 9.0, 15.0, 18.0, 47.0, 70.0, 103.0, 162.0, 343.0, 703.0, 1704.0, 4956.0, 19306.0, 142036.0, 3686048.0, 298418.0, 29479.0, 6695.0, 2141.0, 905.0, 450.0, 234.0, 177.0, 85.0, 48.0, 26.0, 18.0, 21.0, 10.0, 9.0, 10.0, 4.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.945556640625, -1.86962890625, -1.793701171875, -1.7177734375, -1.641845703125, -1.56591796875, -1.489990234375, -1.4140625, -1.338134765625, -1.26220703125, -1.186279296875, -1.1103515625, -1.034423828125, -0.95849609375, -0.882568359375, -0.806640625, -0.730712890625, -0.65478515625, -0.578857421875, -0.5029296875, -0.427001953125, -0.35107421875, -0.275146484375, -0.19921875, -0.123291015625, -0.04736328125, 0.028564453125, 0.1044921875, 0.180419921875, 0.25634765625, 0.332275390625, 0.408203125, 0.484130859375, 0.56005859375, 0.635986328125, 0.7119140625, 0.787841796875, 0.86376953125, 0.939697265625, 1.015625, 1.091552734375, 1.16748046875, 1.243408203125, 1.3193359375, 1.395263671875, 1.47119140625, 1.547119140625, 1.623046875, 1.698974609375, 1.77490234375, 1.850830078125, 1.9267578125, 2.002685546875, 2.07861328125, 2.154541015625, 2.23046875, 2.306396484375, 2.38232421875, 2.458251953125, 2.5341796875, 2.610107421875, 2.68603515625, 2.761962890625, 2.837890625]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 5.0, 5.0, 13.0, 11.0, 12.0, 7.0, 25.0, 24.0, 32.0, 42.0, 57.0, 64.0, 78.0, 99.0, 196.0, 290.0, 611.0, 1078.0, 515.0, 306.0, 169.0, 128.0, 79.0, 49.0, 52.0, 31.0, 26.0, 23.0, 11.0, 14.0, 6.0, 4.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.54541015625, -0.5312004089355469, -0.5169906616210938, -0.5027809143066406, -0.4885711669921875, -0.4743614196777344, -0.46015167236328125, -0.4459419250488281, -0.431732177734375, -0.4175224304199219, -0.40331268310546875, -0.3891029357910156, -0.3748931884765625, -0.3606834411621094, -0.34647369384765625, -0.3322639465332031, -0.31805419921875, -0.3038444519042969, -0.28963470458984375, -0.2754249572753906, -0.2612152099609375, -0.24700546264648438, -0.23279571533203125, -0.21858596801757812, -0.204376220703125, -0.19016647338867188, -0.17595672607421875, -0.16174697875976562, -0.1475372314453125, -0.13332748413085938, -0.11911773681640625, -0.10490798950195312, -0.0906982421875, -0.07648849487304688, -0.06227874755859375, -0.048069000244140625, -0.0338592529296875, -0.019649505615234375, -0.00543975830078125, 0.008769989013671875, 0.022979736328125, 0.037189483642578125, 0.05139923095703125, 0.06560897827148438, 0.0798187255859375, 0.09402847290039062, 0.10823822021484375, 0.12244796752929688, 0.13665771484375, 0.15086746215820312, 0.16507720947265625, 0.17928695678710938, 0.1934967041015625, 0.20770645141601562, 0.22191619873046875, 0.23612594604492188, 0.250335693359375, 0.2645454406738281, 0.27875518798828125, 0.2929649353027344, 0.3071746826171875, 0.3213844299316406, 0.33559417724609375, 0.3498039245605469, 0.364013671875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 9.0, 13.0, 27.0, 35.0, 73.0, 162.0, 200.0, 204.0, 121.0, 60.0, 28.0, 22.0, 14.0, 9.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.757080554962158, -4.624705791473389, -4.492331504821777, -4.359956741333008, -4.227581977844238, -4.095207691192627, -3.9628329277038574, -3.830458402633667, -3.6980838775634766, -3.565709352493286, -3.4333345890045166, -3.300960063934326, -3.1685855388641357, -3.0362110137939453, -2.903836250305176, -2.7714617252349854, -2.639086961746216, -2.5067124366760254, -2.374337673187256, -2.2419631481170654, -2.109588623046875, -1.977213978767395, -1.844839334487915, -1.7124648094177246, -1.5800901651382446, -1.4477155208587646, -1.3153409957885742, -1.1829663515090942, -1.0505917072296143, -0.9182171821594238, -0.7858425378799438, -0.6534679532051086, -0.5210931301116943, -0.38871854543685913, -0.25634393095970154, -0.12396931648254395, 0.00840526819229126, 0.14077985286712646, 0.27315449714660645, 0.40552908182144165, 0.5379036664962769, 0.6702782511711121, 0.8026528358459473, 0.9350274801254272, 1.0674021244049072, 1.1997766494750977, 1.3321512937545776, 1.4645259380340576, 1.596900463104248, 1.729275107383728, 1.8616496324539185, 1.9940242767333984, 2.126398801803589, 2.2587733268737793, 2.391148090362549, 2.5235226154327393, 2.6558971405029297, 2.78827166557312, 2.9206464290618896, 3.05302095413208, 3.1853954792022705, 3.317770004272461, 3.4501447677612305, 3.582519292831421, 3.7148940563201904]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 6.0, 4.0, 3.0, 9.0, 12.0, 19.0, 27.0, 33.0, 45.0, 39.0, 48.0, 50.0, 73.0, 73.0, 71.0, 68.0, 81.0, 67.0, 52.0, 38.0, 35.0, 25.0, 26.0, 29.0, 18.0, 8.0, 7.0, 6.0, 9.0, 6.0, 3.0, 3.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.036879539489746, -1.9790717363357544, -1.9212639331817627, -1.863456130027771, -1.8056483268737793, -1.7478405237197876, -1.690032720565796, -1.6322249174118042, -1.5744171142578125, -1.5166093111038208, -1.458801507949829, -1.4009937047958374, -1.3431859016418457, -1.285378098487854, -1.2275702953338623, -1.1697624921798706, -1.111954689025879, -1.0541468858718872, -0.9963390827178955, -0.9385312795639038, -0.8807234764099121, -0.8229156732559204, -0.7651078701019287, -0.707300066947937, -0.6494922637939453, -0.5916844606399536, -0.5338766574859619, -0.4760688543319702, -0.4182610511779785, -0.3604532480239868, -0.3026454448699951, -0.24483764171600342, -0.18702971935272217, -0.12922191619873047, -0.07141411304473877, -0.01360630989074707, 0.04420149326324463, 0.10200929641723633, 0.15981709957122803, 0.21762490272521973, 0.2754327058792114, 0.3332405090332031, 0.3910483121871948, 0.4488561153411865, 0.5066639184951782, 0.5644717216491699, 0.6222795248031616, 0.6800873279571533, 0.737895131111145, 0.7957029342651367, 0.8535107374191284, 0.9113185405731201, 0.9691263437271118, 1.0269341468811035, 1.0847419500350952, 1.142549753189087, 1.2003575563430786, 1.2581653594970703, 1.315973162651062, 1.3737809658050537, 1.4315887689590454, 1.489396572113037, 1.5472043752670288, 1.6050121784210205, 1.6628199815750122]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 6.0, 4.0, 7.0, 8.0, 13.0, 13.0, 29.0, 22.0, 40.0, 81.0, 137.0, 252.0, 548.0, 1326.0, 3814.0, 14931.0, 92254.0, 752152.0, 154175.0, 20794.0, 5024.0, 1604.0, 640.0, 287.0, 148.0, 86.0, 53.0, 30.0, 23.0, 11.0, 16.0, 6.0, 4.0, 9.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1826171875, -0.17644882202148438, -0.17028045654296875, -0.16411209106445312, -0.1579437255859375, -0.15177536010742188, -0.14560699462890625, -0.13943862915039062, -0.133270263671875, -0.12710189819335938, -0.12093353271484375, -0.11476516723632812, -0.1085968017578125, -0.10242843627929688, -0.09626007080078125, -0.09009170532226562, -0.08392333984375, -0.07775497436523438, -0.07158660888671875, -0.06541824340820312, -0.0592498779296875, -0.053081512451171875, -0.04691314697265625, -0.040744781494140625, -0.034576416015625, -0.028408050537109375, -0.02223968505859375, -0.016071319580078125, -0.0099029541015625, -0.003734588623046875, 0.00243377685546875, 0.008602142333984375, 0.0147705078125, 0.020938873291015625, 0.02710723876953125, 0.033275604248046875, 0.0394439697265625, 0.045612335205078125, 0.05178070068359375, 0.057949066162109375, 0.064117431640625, 0.07028579711914062, 0.07645416259765625, 0.08262252807617188, 0.0887908935546875, 0.09495925903320312, 0.10112762451171875, 0.10729598999023438, 0.11346435546875, 0.11963272094726562, 0.12580108642578125, 0.13196945190429688, 0.1381378173828125, 0.14430618286132812, 0.15047454833984375, 0.15664291381835938, 0.162811279296875, 0.16897964477539062, 0.17514801025390625, 0.18131637573242188, 0.1874847412109375, 0.19365310668945312, 0.19982147216796875, 0.20598983764648438, 0.212158203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 4.0, 8.0, 7.0, 8.0, 10.0, 11.0, 24.0, 36.0, 30.0, 38.0, 50.0, 66.0, 54.0, 97.0, 83.0, 83.0, 75.0, 56.0, 61.0, 41.0, 25.0, 29.0, 22.0, 20.0, 13.0, 6.0, 10.0, 10.0, 3.0, 4.0, 4.0, 5.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.474609375, -1.433349609375, -1.39208984375, -1.350830078125, -1.3095703125, -1.268310546875, -1.22705078125, -1.185791015625, -1.14453125, -1.103271484375, -1.06201171875, -1.020751953125, -0.9794921875, -0.938232421875, -0.89697265625, -0.855712890625, -0.814453125, -0.773193359375, -0.73193359375, -0.690673828125, -0.6494140625, -0.608154296875, -0.56689453125, -0.525634765625, -0.484375, -0.443115234375, -0.40185546875, -0.360595703125, -0.3193359375, -0.278076171875, -0.23681640625, -0.195556640625, -0.154296875, -0.113037109375, -0.07177734375, -0.030517578125, 0.0107421875, 0.052001953125, 0.09326171875, 0.134521484375, 0.17578125, 0.217041015625, 0.25830078125, 0.299560546875, 0.3408203125, 0.382080078125, 0.42333984375, 0.464599609375, 0.505859375, 0.547119140625, 0.58837890625, 0.629638671875, 0.6708984375, 0.712158203125, 0.75341796875, 0.794677734375, 0.8359375, 0.877197265625, 0.91845703125, 0.959716796875, 1.0009765625, 1.042236328125, 1.08349609375, 1.124755859375, 1.166015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 1.0, 3.0, 6.0, 6.0, 12.0, 10.0, 12.0, 13.0, 23.0, 35.0, 33.0, 56.0, 84.0, 120.0, 204.0, 344.0, 933.0, 3299.0, 21889.0, 350177.0, 626302.0, 38411.0, 4559.0, 982.0, 335.0, 235.0, 166.0, 78.0, 60.0, 50.0, 23.0, 21.0, 17.0, 22.0, 7.0, 10.0, 5.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18212890625, -0.1767902374267578, -0.17145156860351562, -0.16611289978027344, -0.16077423095703125, -0.15543556213378906, -0.15009689331054688, -0.1447582244873047, -0.1394195556640625, -0.1340808868408203, -0.12874221801757812, -0.12340354919433594, -0.11806488037109375, -0.11272621154785156, -0.10738754272460938, -0.10204887390136719, -0.096710205078125, -0.09137153625488281, -0.08603286743164062, -0.08069419860839844, -0.07535552978515625, -0.07001686096191406, -0.06467819213867188, -0.05933952331542969, -0.0540008544921875, -0.04866218566894531, -0.043323516845703125, -0.03798484802246094, -0.03264617919921875, -0.027307510375976562, -0.021968841552734375, -0.016630172729492188, -0.01129150390625, -0.0059528350830078125, -0.000614166259765625, 0.0047245025634765625, 0.01006317138671875, 0.015401840209960938, 0.020740509033203125, 0.026079177856445312, 0.0314178466796875, 0.03675651550292969, 0.042095184326171875, 0.04743385314941406, 0.05277252197265625, 0.05811119079589844, 0.06344985961914062, 0.06878852844238281, 0.074127197265625, 0.07946586608886719, 0.08480453491210938, 0.09014320373535156, 0.09548187255859375, 0.10082054138183594, 0.10615921020507812, 0.11149787902832031, 0.1168365478515625, 0.12217521667480469, 0.12751388549804688, 0.13285255432128906, 0.13819122314453125, 0.14352989196777344, 0.14886856079101562, 0.1542072296142578, 0.1595458984375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 7.0, 5.0, 7.0, 14.0, 6.0, 8.0, 19.0, 23.0, 22.0, 29.0, 36.0, 26.0, 47.0, 57.0, 58.0, 65.0, 48.0, 60.0, 58.0, 68.0, 54.0, 43.0, 42.0, 39.0, 25.0, 22.0, 20.0, 19.0, 14.0, 13.0, 12.0, 7.0, 13.0, 5.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9677734375, -1.908416748046875, -1.84906005859375, -1.789703369140625, -1.7303466796875, -1.670989990234375, -1.61163330078125, -1.552276611328125, -1.492919921875, -1.433563232421875, -1.37420654296875, -1.314849853515625, -1.2554931640625, -1.196136474609375, -1.13677978515625, -1.077423095703125, -1.01806640625, -0.958709716796875, -0.89935302734375, -0.839996337890625, -0.7806396484375, -0.721282958984375, -0.66192626953125, -0.602569580078125, -0.543212890625, -0.483856201171875, -0.42449951171875, -0.365142822265625, -0.3057861328125, -0.246429443359375, -0.18707275390625, -0.127716064453125, -0.068359375, -0.009002685546875, 0.05035400390625, 0.109710693359375, 0.1690673828125, 0.228424072265625, 0.28778076171875, 0.347137451171875, 0.406494140625, 0.465850830078125, 0.52520751953125, 0.584564208984375, 0.6439208984375, 0.703277587890625, 0.76263427734375, 0.821990966796875, 0.88134765625, 0.940704345703125, 1.00006103515625, 1.059417724609375, 1.1187744140625, 1.178131103515625, 1.23748779296875, 1.296844482421875, 1.356201171875, 1.415557861328125, 1.47491455078125, 1.534271240234375, 1.5936279296875, 1.652984619140625, 1.71234130859375, 1.771697998046875, 1.8310546875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 7.0, 8.0, 10.0, 8.0, 16.0, 23.0, 31.0, 42.0, 60.0, 93.0, 131.0, 254.0, 450.0, 1085.0, 3937.0, 58084.0, 950372.0, 29106.0, 2893.0, 862.0, 404.0, 199.0, 144.0, 94.0, 66.0, 38.0, 34.0, 33.0, 22.0, 11.0, 11.0, 9.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035736083984375, -0.034697532653808594, -0.03365898132324219, -0.03262042999267578, -0.031581878662109375, -0.03054332733154297, -0.029504776000976562, -0.028466224670410156, -0.02742767333984375, -0.026389122009277344, -0.025350570678710938, -0.02431201934814453, -0.023273468017578125, -0.02223491668701172, -0.021196365356445312, -0.020157814025878906, -0.0191192626953125, -0.018080711364746094, -0.017042160034179688, -0.01600360870361328, -0.014965057373046875, -0.013926506042480469, -0.012887954711914062, -0.011849403381347656, -0.01081085205078125, -0.009772300720214844, -0.008733749389648438, -0.007695198059082031, -0.006656646728515625, -0.005618095397949219, -0.0045795440673828125, -0.0035409927368164062, -0.00250244140625, -0.0014638900756835938, -0.0004253387451171875, 0.0006132125854492188, 0.001651763916015625, 0.0026903152465820312, 0.0037288665771484375, 0.004767417907714844, 0.00580596923828125, 0.006844520568847656, 0.007883071899414062, 0.008921623229980469, 0.009960174560546875, 0.010998725891113281, 0.012037277221679688, 0.013075828552246094, 0.0141143798828125, 0.015152931213378906, 0.016191482543945312, 0.01723003387451172, 0.018268585205078125, 0.01930713653564453, 0.020345687866210938, 0.021384239196777344, 0.02242279052734375, 0.023461341857910156, 0.024499893188476562, 0.02553844451904297, 0.026576995849609375, 0.02761554718017578, 0.028654098510742188, 0.029692649841308594, 0.030731201171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 12.0, 13.0, 12.0, 28.0, 33.0, 67.0, 90.0, 127.0, 179.0, 141.0, 105.0, 62.0, 47.0, 28.0, 22.0, 7.0, 10.0, 4.0, 8.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.722574234008789e-05, -1.66427344083786e-05, -1.605972647666931e-05, -1.5476718544960022e-05, -1.4893710613250732e-05, -1.4310702681541443e-05, -1.3727694749832153e-05, -1.3144686818122864e-05, -1.2561678886413574e-05, -1.1978670954704285e-05, -1.1395663022994995e-05, -1.0812655091285706e-05, -1.0229647159576416e-05, -9.646639227867126e-06, -9.063631296157837e-06, -8.480623364448547e-06, -7.897615432739258e-06, -7.314607501029968e-06, -6.731599569320679e-06, -6.148591637611389e-06, -5.5655837059021e-06, -4.98257577419281e-06, -4.3995678424835205e-06, -3.816559910774231e-06, -3.2335519790649414e-06, -2.650544047355652e-06, -2.0675361156463623e-06, -1.4845281839370728e-06, -9.015202522277832e-07, -3.1851232051849365e-07, 2.644956111907959e-07, 8.475035429000854e-07, 1.430511474609375e-06, 2.0135194063186646e-06, 2.596527338027954e-06, 3.1795352697372437e-06, 3.762543201446533e-06, 4.345551133155823e-06, 4.928559064865112e-06, 5.511566996574402e-06, 6.094574928283691e-06, 6.677582859992981e-06, 7.2605907917022705e-06, 7.84359872341156e-06, 8.42660665512085e-06, 9.00961458683014e-06, 9.592622518539429e-06, 1.0175630450248718e-05, 1.0758638381958008e-05, 1.1341646313667297e-05, 1.1924654245376587e-05, 1.2507662177085876e-05, 1.3090670108795166e-05, 1.3673678040504456e-05, 1.4256685972213745e-05, 1.4839693903923035e-05, 1.5422701835632324e-05, 1.6005709767341614e-05, 1.6588717699050903e-05, 1.7171725630760193e-05, 1.7754733562469482e-05, 1.8337741494178772e-05, 1.892074942588806e-05, 1.950375735759735e-05, 2.008676528930664e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 4.0, 11.0, 13.0, 10.0, 11.0, 17.0, 35.0, 22.0, 41.0, 48.0, 74.0, 108.0, 154.0, 226.0, 407.0, 599.0, 1048.0, 1954.0, 4097.0, 9904.0, 33842.0, 221509.0, 671376.0, 73457.0, 17108.0, 6201.0, 2668.0, 1387.0, 754.0, 477.0, 283.0, 181.0, 143.0, 104.0, 68.0, 52.0, 41.0, 28.0, 20.0, 21.0, 15.0, 6.0, 3.0, 7.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.022613525390625, -0.021889686584472656, -0.021165847778320312, -0.02044200897216797, -0.019718170166015625, -0.01899433135986328, -0.018270492553710938, -0.017546653747558594, -0.01682281494140625, -0.016098976135253906, -0.015375137329101562, -0.014651298522949219, -0.013927459716796875, -0.013203620910644531, -0.012479782104492188, -0.011755943298339844, -0.0110321044921875, -0.010308265686035156, -0.009584426879882812, -0.008860588073730469, -0.008136749267578125, -0.007412910461425781, -0.0066890716552734375, -0.005965232849121094, -0.00524139404296875, -0.004517555236816406, -0.0037937164306640625, -0.0030698776245117188, -0.002346038818359375, -0.0016222000122070312, -0.0008983612060546875, -0.00017452239990234375, 0.00054931640625, 0.0012731552124023438, 0.0019969940185546875, 0.0027208328247070312, 0.003444671630859375, 0.004168510437011719, 0.0048923492431640625, 0.005616188049316406, 0.00634002685546875, 0.007063865661621094, 0.0077877044677734375, 0.008511543273925781, 0.009235382080078125, 0.009959220886230469, 0.010683059692382812, 0.011406898498535156, 0.0121307373046875, 0.012854576110839844, 0.013578414916992188, 0.014302253723144531, 0.015026092529296875, 0.01574993133544922, 0.016473770141601562, 0.017197608947753906, 0.01792144775390625, 0.018645286560058594, 0.019369125366210938, 0.02009296417236328, 0.020816802978515625, 0.02154064178466797, 0.022264480590820312, 0.022988319396972656, 0.023712158203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 8.0, 9.0, 13.0, 17.0, 28.0, 44.0, 61.0, 91.0, 118.0, 182.0, 149.0, 91.0, 45.0, 45.0, 30.0, 18.0, 9.0, 6.0, 6.0, 8.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0052490234375, -0.005077719688415527, -0.004906415939331055, -0.004735112190246582, -0.004563808441162109, -0.004392504692077637, -0.004221200942993164, -0.004049897193908691, -0.0038785934448242188, -0.003707289695739746, -0.0035359859466552734, -0.0033646821975708008, -0.003193378448486328, -0.0030220746994018555, -0.002850770950317383, -0.00267946720123291, -0.0025081634521484375, -0.002336859703063965, -0.002165555953979492, -0.0019942522048950195, -0.0018229484558105469, -0.0016516447067260742, -0.0014803409576416016, -0.001309037208557129, -0.0011377334594726562, -0.0009664297103881836, -0.0007951259613037109, -0.0006238222122192383, -0.0004525184631347656, -0.00028121471405029297, -0.00010991096496582031, 6.139278411865234e-05, 0.000232696533203125, 0.00040400028228759766, 0.0005753040313720703, 0.000746607780456543, 0.0009179115295410156, 0.0010892152786254883, 0.001260519027709961, 0.0014318227767944336, 0.0016031265258789062, 0.001774430274963379, 0.0019457340240478516, 0.0021170377731323242, 0.002288341522216797, 0.0024596452713012695, 0.002630949020385742, 0.002802252769470215, 0.0029735565185546875, 0.00314486026763916, 0.003316164016723633, 0.0034874677658081055, 0.003658771514892578, 0.0038300752639770508, 0.0040013790130615234, 0.004172682762145996, 0.004343986511230469, 0.004515290260314941, 0.004686594009399414, 0.004857897758483887, 0.005029201507568359, 0.005200505256652832, 0.005371809005737305, 0.005543112754821777, 0.00571441650390625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 6.0, 4.0, 9.0, 9.0, 21.0, 41.0, 112.0, 257.0, 298.0, 126.0, 60.0, 28.0, 13.0, 8.0, 1.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.628101110458374, -3.511425018310547, -3.3947486877441406, -3.2780725955963135, -3.1613965034484863, -3.044720411300659, -2.928044319152832, -2.811367988586426, -2.6946918964385986, -2.5780158042907715, -2.4613394737243652, -2.344663381576538, -2.227987289428711, -2.111311197280884, -1.994634985923767, -1.8779587745666504, -1.7612826824188232, -1.644606590270996, -1.5279303789138794, -1.4112541675567627, -1.2945780754089355, -1.1779019832611084, -1.0612257719039917, -0.9445496201515198, -0.8278734683990479, -0.7111973166465759, -0.594521164894104, -0.4778450131416321, -0.36116886138916016, -0.24449270963668823, -0.1278165578842163, -0.011140406131744385, 0.10553574562072754, 0.22221189737319946, 0.3388880491256714, 0.4555642008781433, 0.5722403526306152, 0.6889165043830872, 0.8055926561355591, 0.922268807888031, 1.038944959640503, 1.15562105178833, 1.2722972631454468, 1.3889734745025635, 1.5056495666503906, 1.6223256587982178, 1.7390018701553345, 1.8556780815124512, 1.9723541736602783, 2.0890302658081055, 2.2057065963745117, 2.322382688522339, 2.439058780670166, 2.555734872817993, 2.6724109649658203, 2.7890872955322266, 2.9057633876800537, 3.022439479827881, 3.139115810394287, 3.2557919025421143, 3.3724679946899414, 3.4891440868377686, 3.6058201789855957, 3.722496509552002, 3.839172601699829]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 6.0, 5.0, 3.0, 4.0, 6.0, 11.0, 13.0, 23.0, 38.0, 41.0, 46.0, 57.0, 65.0, 84.0, 95.0, 75.0, 92.0, 82.0, 52.0, 43.0, 38.0, 27.0, 20.0, 21.0, 16.0, 5.0, 9.0, 5.0, 7.0, 4.0, 1.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.5767064094543457, -1.5342743396759033, -1.491842269897461, -1.4494102001190186, -1.4069781303405762, -1.3645459413528442, -1.3221138715744019, -1.2796818017959595, -1.237249732017517, -1.1948176622390747, -1.1523855924606323, -1.10995352268219, -1.067521333694458, -1.0250892639160156, -0.9826571941375732, -0.9402251243591309, -0.8977930545806885, -0.8553609848022461, -0.8129289150238037, -0.7704967856407166, -0.7280647158622742, -0.6856326460838318, -0.6432005167007446, -0.6007684469223022, -0.5583363771438599, -0.5159043073654175, -0.4734722077846527, -0.43104010820388794, -0.38860803842544556, -0.3461759686470032, -0.3037438690662384, -0.26131176948547363, -0.21887969970703125, -0.17644761502742767, -0.1340155303478241, -0.09158344566822052, -0.04915136098861694, -0.006719276309013367, 0.03571280837059021, 0.07814490795135498, 0.12057697772979736, 0.16300906240940094, 0.20544114708900452, 0.2478732317686081, 0.29030531644821167, 0.33273738622665405, 0.3751694858074188, 0.4176015853881836, 0.460033655166626, 0.5024657249450684, 0.5448977947235107, 0.5873299241065979, 0.6297619938850403, 0.6721940636634827, 0.7146261930465698, 0.7570582628250122, 0.7994903326034546, 0.841922402381897, 0.8843544721603394, 0.9267866015434265, 0.9692186713218689, 1.011650800704956, 1.0540828704833984, 1.0965149402618408, 1.1389470100402832]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 6.0, 12.0, 8.0, 27.0, 35.0, 50.0, 75.0, 115.0, 150.0, 260.0, 468.0, 736.0, 1313.0, 2383.0, 4664.0, 9711.0, 22715.0, 60260.0, 199949.0, 468273.0, 181027.0, 56150.0, 21153.0, 9251.0, 4313.0, 2324.0, 1256.0, 733.0, 412.0, 250.0, 170.0, 99.0, 66.0, 38.0, 22.0, 22.0, 14.0, 12.0, 4.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83935546875, -0.8134994506835938, -0.7876434326171875, -0.7617874145507812, -0.735931396484375, -0.7100753784179688, -0.6842193603515625, -0.6583633422851562, -0.63250732421875, -0.6066513061523438, -0.5807952880859375, -0.5549392700195312, -0.529083251953125, -0.5032272338867188, -0.4773712158203125, -0.45151519775390625, -0.4256591796875, -0.39980316162109375, -0.3739471435546875, -0.34809112548828125, -0.322235107421875, -0.29637908935546875, -0.2705230712890625, -0.24466705322265625, -0.21881103515625, -0.19295501708984375, -0.1670989990234375, -0.14124298095703125, -0.115386962890625, -0.08953094482421875, -0.0636749267578125, -0.03781890869140625, -0.011962890625, 0.01389312744140625, 0.0397491455078125, 0.06560516357421875, 0.091461181640625, 0.11731719970703125, 0.1431732177734375, 0.16902923583984375, 0.19488525390625, 0.22074127197265625, 0.2465972900390625, 0.27245330810546875, 0.298309326171875, 0.32416534423828125, 0.3500213623046875, 0.37587738037109375, 0.4017333984375, 0.42758941650390625, 0.4534454345703125, 0.47930145263671875, 0.505157470703125, 0.5310134887695312, 0.5568695068359375, 0.5827255249023438, 0.60858154296875, 0.6344375610351562, 0.6602935791015625, 0.6861495971679688, 0.712005615234375, 0.7378616333007812, 0.7637176513671875, 0.7895736694335938, 0.8154296875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 7.0, 7.0, 7.0, 11.0, 13.0, 28.0, 35.0, 44.0, 57.0, 75.0, 70.0, 112.0, 110.0, 100.0, 66.0, 67.0, 48.0, 32.0, 28.0, 19.0, 14.0, 15.0, 8.0, 6.0, 6.0, 4.0, 4.0, 2.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-4.50390625, -4.3897705078125, -4.275634765625, -4.1614990234375, -4.04736328125, -3.9332275390625, -3.819091796875, -3.7049560546875, -3.5908203125, -3.4766845703125, -3.362548828125, -3.2484130859375, -3.13427734375, -3.0201416015625, -2.906005859375, -2.7918701171875, -2.677734375, -2.5635986328125, -2.449462890625, -2.3353271484375, -2.22119140625, -2.1070556640625, -1.992919921875, -1.8787841796875, -1.7646484375, -1.6505126953125, -1.536376953125, -1.4222412109375, -1.30810546875, -1.1939697265625, -1.079833984375, -0.9656982421875, -0.8515625, -0.7374267578125, -0.623291015625, -0.5091552734375, -0.39501953125, -0.2808837890625, -0.166748046875, -0.0526123046875, 0.0615234375, 0.1756591796875, 0.289794921875, 0.4039306640625, 0.51806640625, 0.6322021484375, 0.746337890625, 0.8604736328125, 0.974609375, 1.0887451171875, 1.202880859375, 1.3170166015625, 1.43115234375, 1.5452880859375, 1.659423828125, 1.7735595703125, 1.8876953125, 2.0018310546875, 2.115966796875, 2.2301025390625, 2.34423828125, 2.4583740234375, 2.572509765625, 2.6866455078125, 2.80078125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 5.0, 8.0, 9.0, 7.0, 21.0, 20.0, 22.0, 31.0, 52.0, 49.0, 76.0, 93.0, 154.0, 234.0, 450.0, 773.0, 1635.0, 3860.0, 10608.0, 37541.0, 175318.0, 583892.0, 177260.0, 38197.0, 10911.0, 3803.0, 1598.0, 728.0, 391.0, 262.0, 162.0, 104.0, 65.0, 49.0, 32.0, 26.0, 28.0, 14.0, 18.0, 12.0, 10.0, 8.0, 5.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.82373046875, -0.7983856201171875, -0.773040771484375, -0.7476959228515625, -0.72235107421875, -0.6970062255859375, -0.671661376953125, -0.6463165283203125, -0.6209716796875, -0.5956268310546875, -0.570281982421875, -0.5449371337890625, -0.51959228515625, -0.4942474365234375, -0.468902587890625, -0.4435577392578125, -0.418212890625, -0.3928680419921875, -0.367523193359375, -0.3421783447265625, -0.31683349609375, -0.2914886474609375, -0.266143798828125, -0.2407989501953125, -0.2154541015625, -0.1901092529296875, -0.164764404296875, -0.1394195556640625, -0.11407470703125, -0.0887298583984375, -0.063385009765625, -0.0380401611328125, -0.0126953125, 0.0126495361328125, 0.037994384765625, 0.0633392333984375, 0.08868408203125, 0.1140289306640625, 0.139373779296875, 0.1647186279296875, 0.1900634765625, 0.2154083251953125, 0.240753173828125, 0.2660980224609375, 0.29144287109375, 0.3167877197265625, 0.342132568359375, 0.3674774169921875, 0.392822265625, 0.4181671142578125, 0.443511962890625, 0.4688568115234375, 0.49420166015625, 0.5195465087890625, 0.544891357421875, 0.5702362060546875, 0.5955810546875, 0.6209259033203125, 0.646270751953125, 0.6716156005859375, 0.69696044921875, 0.7223052978515625, 0.747650146484375, 0.7729949951171875, 0.79833984375]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 4.0, 7.0, 6.0, 16.0, 12.0, 15.0, 15.0, 18.0, 14.0, 27.0, 25.0, 37.0, 30.0, 44.0, 33.0, 43.0, 50.0, 50.0, 54.0, 56.0, 46.0, 47.0, 50.0, 37.0, 36.0, 36.0, 24.0, 24.0, 21.0, 19.0, 22.0, 21.0, 16.0, 10.0, 4.0, 4.0, 4.0, 7.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0], "bins": [-3.189453125, -3.103912353515625, -3.01837158203125, -2.932830810546875, -2.8472900390625, -2.761749267578125, -2.67620849609375, -2.590667724609375, -2.505126953125, -2.419586181640625, -2.33404541015625, -2.248504638671875, -2.1629638671875, -2.077423095703125, -1.99188232421875, -1.906341552734375, -1.82080078125, -1.735260009765625, -1.64971923828125, -1.564178466796875, -1.4786376953125, -1.393096923828125, -1.30755615234375, -1.222015380859375, -1.136474609375, -1.050933837890625, -0.96539306640625, -0.879852294921875, -0.7943115234375, -0.708770751953125, -0.62322998046875, -0.537689208984375, -0.4521484375, -0.366607666015625, -0.28106689453125, -0.195526123046875, -0.1099853515625, -0.024444580078125, 0.06109619140625, 0.146636962890625, 0.232177734375, 0.317718505859375, 0.40325927734375, 0.488800048828125, 0.5743408203125, 0.659881591796875, 0.74542236328125, 0.830963134765625, 0.91650390625, 1.002044677734375, 1.08758544921875, 1.173126220703125, 1.2586669921875, 1.344207763671875, 1.42974853515625, 1.515289306640625, 1.600830078125, 1.686370849609375, 1.77191162109375, 1.857452392578125, 1.9429931640625, 2.028533935546875, 2.11407470703125, 2.199615478515625, 2.28515625]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 1.0, 7.0, 6.0, 11.0, 14.0, 33.0, 49.0, 91.0, 164.0, 319.0, 635.0, 1570.0, 4868.0, 23593.0, 251524.0, 693773.0, 58550.0, 8944.0, 2506.0, 909.0, 468.0, 216.0, 120.0, 65.0, 45.0, 26.0, 15.0, 11.0, 10.0, 3.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.572265625, -0.5519866943359375, -0.531707763671875, -0.5114288330078125, -0.49114990234375, -0.4708709716796875, -0.450592041015625, -0.4303131103515625, -0.4100341796875, -0.3897552490234375, -0.369476318359375, -0.3491973876953125, -0.32891845703125, -0.3086395263671875, -0.288360595703125, -0.2680816650390625, -0.247802734375, -0.2275238037109375, -0.207244873046875, -0.1869659423828125, -0.16668701171875, -0.1464080810546875, -0.126129150390625, -0.1058502197265625, -0.0855712890625, -0.0652923583984375, -0.045013427734375, -0.0247344970703125, -0.00445556640625, 0.0158233642578125, 0.036102294921875, 0.0563812255859375, 0.07666015625, 0.0969390869140625, 0.117218017578125, 0.1374969482421875, 0.15777587890625, 0.1780548095703125, 0.198333740234375, 0.2186126708984375, 0.2388916015625, 0.2591705322265625, 0.279449462890625, 0.2997283935546875, 0.32000732421875, 0.3402862548828125, 0.360565185546875, 0.3808441162109375, 0.401123046875, 0.4214019775390625, 0.441680908203125, 0.4619598388671875, 0.48223876953125, 0.5025177001953125, 0.522796630859375, 0.5430755615234375, 0.5633544921875, 0.5836334228515625, 0.603912353515625, 0.6241912841796875, 0.64447021484375, 0.6647491455078125, 0.685028076171875, 0.7053070068359375, 0.7255859375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 3.0, 9.0, 6.0, 9.0, 30.0, 34.0, 39.0, 60.0, 93.0, 124.0, 156.0, 116.0, 99.0, 68.0, 42.0, 35.0, 27.0, 13.0, 7.0, 3.0, 11.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010877847671508789, -0.00010509323328733444, -0.000101407989859581, -9.772274643182755e-05, -9.40375030040741e-05, -9.035225957632065e-05, -8.66670161485672e-05, -8.298177272081375e-05, -7.92965292930603e-05, -7.561128586530685e-05, -7.19260424375534e-05, -6.824079900979996e-05, -6.455555558204651e-05, -6.087031215429306e-05, -5.718506872653961e-05, -5.349982529878616e-05, -4.9814581871032715e-05, -4.6129338443279266e-05, -4.244409501552582e-05, -3.875885158777237e-05, -3.507360816001892e-05, -3.138836473226547e-05, -2.7703121304512024e-05, -2.4017877876758575e-05, -2.0332634449005127e-05, -1.664739102125168e-05, -1.296214759349823e-05, -9.276904165744781e-06, -5.591660737991333e-06, -1.9064173102378845e-06, 1.778826117515564e-06, 5.4640695452690125e-06, 9.149312973022461e-06, 1.283455640077591e-05, 1.6519799828529358e-05, 2.0205043256282806e-05, 2.3890286684036255e-05, 2.7575530111789703e-05, 3.126077353954315e-05, 3.49460169672966e-05, 3.863126039505005e-05, 4.23165038228035e-05, 4.6001747250556946e-05, 4.9686990678310394e-05, 5.337223410606384e-05, 5.705747753381729e-05, 6.074272096157074e-05, 6.442796438932419e-05, 6.811320781707764e-05, 7.179845124483109e-05, 7.548369467258453e-05, 7.916893810033798e-05, 8.285418152809143e-05, 8.653942495584488e-05, 9.022466838359833e-05, 9.390991181135178e-05, 9.759515523910522e-05, 0.00010128039866685867, 0.00010496564209461212, 0.00010865088552236557, 0.00011233612895011902, 0.00011602137237787247, 0.00011970661580562592, 0.00012339185923337936, 0.0001270771026611328]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 10.0, 7.0, 8.0, 22.0, 28.0, 40.0, 52.0, 105.0, 175.0, 292.0, 575.0, 1260.0, 2934.0, 9003.0, 34497.0, 216408.0, 640489.0, 110905.0, 21260.0, 6217.0, 2205.0, 1038.0, 462.0, 225.0, 134.0, 78.0, 48.0, 31.0, 14.0, 9.0, 3.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44091796875, -0.4258880615234375, -0.410858154296875, -0.3958282470703125, -0.38079833984375, -0.3657684326171875, -0.350738525390625, -0.3357086181640625, -0.3206787109375, -0.3056488037109375, -0.290618896484375, -0.2755889892578125, -0.26055908203125, -0.2455291748046875, -0.230499267578125, -0.2154693603515625, -0.200439453125, -0.1854095458984375, -0.170379638671875, -0.1553497314453125, -0.14031982421875, -0.1252899169921875, -0.110260009765625, -0.0952301025390625, -0.0802001953125, -0.0651702880859375, -0.050140380859375, -0.0351104736328125, -0.02008056640625, -0.0050506591796875, 0.009979248046875, 0.0250091552734375, 0.0400390625, 0.0550689697265625, 0.070098876953125, 0.0851287841796875, 0.10015869140625, 0.1151885986328125, 0.130218505859375, 0.1452484130859375, 0.1602783203125, 0.1753082275390625, 0.190338134765625, 0.2053680419921875, 0.22039794921875, 0.2354278564453125, 0.250457763671875, 0.2654876708984375, 0.280517578125, 0.2955474853515625, 0.310577392578125, 0.3256072998046875, 0.34063720703125, 0.3556671142578125, 0.370697021484375, 0.3857269287109375, 0.4007568359375, 0.4157867431640625, 0.430816650390625, 0.4458465576171875, 0.46087646484375, 0.4759063720703125, 0.490936279296875, 0.5059661865234375, 0.52099609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 5.0, 7.0, 4.0, 5.0, 6.0, 13.0, 7.0, 16.0, 22.0, 24.0, 27.0, 34.0, 45.0, 63.0, 63.0, 64.0, 85.0, 74.0, 77.0, 62.0, 48.0, 53.0, 40.0, 35.0, 18.0, 22.0, 16.0, 13.0, 16.0, 13.0, 8.0, 6.0, 4.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1866455078125, -0.18062591552734375, -0.1746063232421875, -0.16858673095703125, -0.162567138671875, -0.15654754638671875, -0.1505279541015625, -0.14450836181640625, -0.13848876953125, -0.13246917724609375, -0.1264495849609375, -0.12042999267578125, -0.114410400390625, -0.10839080810546875, -0.1023712158203125, -0.09635162353515625, -0.09033203125, -0.08431243896484375, -0.0782928466796875, -0.07227325439453125, -0.066253662109375, -0.06023406982421875, -0.0542144775390625, -0.04819488525390625, -0.04217529296875, -0.03615570068359375, -0.0301361083984375, -0.02411651611328125, -0.018096923828125, -0.01207733154296875, -0.0060577392578125, -3.814697265625e-05, 0.0059814453125, 0.01200103759765625, 0.0180206298828125, 0.02404022216796875, 0.030059814453125, 0.03607940673828125, 0.0420989990234375, 0.04811859130859375, 0.05413818359375, 0.06015777587890625, 0.0661773681640625, 0.07219696044921875, 0.078216552734375, 0.08423614501953125, 0.0902557373046875, 0.09627532958984375, 0.102294921875, 0.10831451416015625, 0.1143341064453125, 0.12035369873046875, 0.126373291015625, 0.13239288330078125, 0.1384124755859375, 0.14443206787109375, 0.15045166015625, 0.15647125244140625, 0.1624908447265625, 0.16851043701171875, 0.174530029296875, 0.18054962158203125, 0.1865692138671875, 0.19258880615234375, 0.1986083984375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 9.0, 14.0, 26.0, 50.0, 181.0, 336.0, 212.0, 86.0, 44.0, 13.0, 8.0, 8.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.21556282043457, -7.9559326171875, -7.6963019371032715, -7.436671733856201, -7.177041053771973, -6.917410850524902, -6.657780647277832, -6.398150444030762, -6.138519763946533, -5.878889560699463, -5.619258880615234, -5.359628677368164, -5.099998474121094, -4.840367794036865, -4.580737590789795, -4.321106910705566, -4.061476707458496, -3.8018462657928467, -3.5422158241271973, -3.282585620880127, -3.0229551792144775, -2.763324737548828, -2.503694534301758, -2.2440640926361084, -1.984433650970459, -1.7248032093048096, -1.4651728868484497, -1.2055425643920898, -0.9459121227264404, -0.686281681060791, -0.42665135860443115, -0.1670210361480713, 0.09260845184326172, 0.35223883390426636, 0.611869215965271, 0.8714995980262756, 1.1311299800872803, 1.3907604217529297, 1.6503907442092896, 1.9100210666656494, 2.169651508331299, 2.4292819499969482, 2.6889123916625977, 2.948542594909668, 3.2081730365753174, 3.467803478240967, 3.727433681488037, 3.9870641231536865, 4.246694564819336, 4.506324768066406, 4.765955448150635, 5.025585651397705, 5.285216331481934, 5.544846534729004, 5.804476737976074, 6.0641069412231445, 6.323737621307373, 6.583367824554443, 6.842998504638672, 7.102628707885742, 7.3622589111328125, 7.621889591217041, 7.881519794464111, 8.14115047454834, 8.40078067779541]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 6.0, 1.0, 9.0, 9.0, 6.0, 14.0, 20.0, 18.0, 19.0, 17.0, 23.0, 30.0, 36.0, 36.0, 40.0, 40.0, 45.0, 47.0, 29.0, 42.0, 42.0, 51.0, 43.0, 38.0, 50.0, 30.0, 39.0, 30.0, 32.0, 23.0, 19.0, 30.0, 20.0, 12.0, 9.0, 7.0, 9.0, 14.0, 3.0, 5.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.297725200653076, -5.128629684448242, -4.959534645080566, -4.790439128875732, -4.621343612670898, -4.452248573303223, -4.283153057098389, -4.114057540893555, -3.944962501525879, -3.775867223739624, -3.606771945953369, -3.437676429748535, -3.2685811519622803, -3.0994858741760254, -2.9303903579711914, -2.7612950801849365, -2.5921998023986816, -2.4231045246124268, -2.254009246826172, -2.084913730621338, -1.915818452835083, -1.7467231750488281, -1.5776277780532837, -1.4085323810577393, -1.2394371032714844, -1.0703418254852295, -0.9012464284896851, -0.7321510910987854, -0.5630557537078857, -0.3939604163169861, -0.22486507892608643, -0.05576968193054199, 0.1133260726928711, 0.28242141008377075, 0.4515167474746704, 0.6206120848655701, 0.7897074222564697, 0.9588027596473694, 1.127898097038269, 1.2969934940338135, 1.4660887718200684, 1.6351840496063232, 1.8042794466018677, 1.973374843597412, 2.142470121383667, 2.311565399169922, 2.480660915374756, 2.6497561931610107, 2.8188514709472656, 2.9879467487335205, 3.1570420265197754, 3.3261375427246094, 3.4952328205108643, 3.664328098297119, 3.833423614501953, 4.002518653869629, 4.171614170074463, 4.340709686279297, 4.509804725646973, 4.678900241851807, 4.847995758056641, 5.017090797424316, 5.18618631362915, 5.355281829833984, 5.52437686920166]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 8.0, 12.0, 15.0, 25.0, 37.0, 75.0, 116.0, 202.0, 336.0, 553.0, 1027.0, 2103.0, 4592.0, 12446.0, 44382.0, 303836.0, 3480611.0, 280231.0, 42048.0, 12320.0, 4718.0, 2137.0, 1041.0, 558.0, 338.0, 189.0, 111.0, 70.0, 49.0, 42.0, 22.0, 15.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.326171875, -2.2641143798828125, -2.202056884765625, -2.1399993896484375, -2.07794189453125, -2.0158843994140625, -1.953826904296875, -1.8917694091796875, -1.8297119140625, -1.7676544189453125, -1.705596923828125, -1.6435394287109375, -1.58148193359375, -1.5194244384765625, -1.457366943359375, -1.3953094482421875, -1.333251953125, -1.2711944580078125, -1.209136962890625, -1.1470794677734375, -1.08502197265625, -1.0229644775390625, -0.960906982421875, -0.8988494873046875, -0.8367919921875, -0.7747344970703125, -0.712677001953125, -0.6506195068359375, -0.58856201171875, -0.5265045166015625, -0.464447021484375, -0.4023895263671875, -0.34033203125, -0.2782745361328125, -0.216217041015625, -0.1541595458984375, -0.09210205078125, -0.0300445556640625, 0.032012939453125, 0.0940704345703125, 0.1561279296875, 0.2181854248046875, 0.280242919921875, 0.3423004150390625, 0.40435791015625, 0.4664154052734375, 0.528472900390625, 0.5905303955078125, 0.652587890625, 0.7146453857421875, 0.776702880859375, 0.8387603759765625, 0.90081787109375, 0.9628753662109375, 1.024932861328125, 1.0869903564453125, 1.1490478515625, 1.2111053466796875, 1.273162841796875, 1.3352203369140625, 1.39727783203125, 1.4593353271484375, 1.521392822265625, 1.5834503173828125, 1.6455078125]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 0.0, 7.0, 11.0, 9.0, 15.0, 40.0, 37.0, 55.0, 74.0, 82.0, 127.0, 116.0, 117.0, 82.0, 69.0, 42.0, 29.0, 22.0, 10.0, 12.0, 8.0, 13.0, 7.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.46484375, -2.3991241455078125, -2.333404541015625, -2.2676849365234375, -2.20196533203125, -2.1362457275390625, -2.070526123046875, -2.0048065185546875, -1.9390869140625, -1.8733673095703125, -1.807647705078125, -1.7419281005859375, -1.67620849609375, -1.6104888916015625, -1.544769287109375, -1.4790496826171875, -1.413330078125, -1.3476104736328125, -1.281890869140625, -1.2161712646484375, -1.15045166015625, -1.0847320556640625, -1.019012451171875, -0.9532928466796875, -0.8875732421875, -0.8218536376953125, -0.756134033203125, -0.6904144287109375, -0.62469482421875, -0.5589752197265625, -0.493255615234375, -0.4275360107421875, -0.36181640625, -0.2960968017578125, -0.230377197265625, -0.1646575927734375, -0.09893798828125, -0.0332183837890625, 0.032501220703125, 0.0982208251953125, 0.1639404296875, 0.2296600341796875, 0.295379638671875, 0.3610992431640625, 0.42681884765625, 0.4925384521484375, 0.558258056640625, 0.6239776611328125, 0.689697265625, 0.7554168701171875, 0.821136474609375, 0.8868560791015625, 0.95257568359375, 1.0182952880859375, 1.084014892578125, 1.1497344970703125, 1.2154541015625, 1.2811737060546875, 1.346893310546875, 1.4126129150390625, 1.47833251953125, 1.5440521240234375, 1.609771728515625, 1.6754913330078125, 1.7412109375]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 12.0, 18.0, 20.0, 26.0, 54.0, 81.0, 112.0, 272.0, 534.0, 1409.0, 4343.0, 19394.0, 192026.0, 3807153.0, 146124.0, 16686.0, 3756.0, 1195.0, 486.0, 243.0, 135.0, 73.0, 42.0, 30.0, 20.0, 12.0, 5.0, 9.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.49609375, -3.405181884765625, -3.31427001953125, -3.223358154296875, -3.1324462890625, -3.041534423828125, -2.95062255859375, -2.859710693359375, -2.768798828125, -2.677886962890625, -2.58697509765625, -2.496063232421875, -2.4051513671875, -2.314239501953125, -2.22332763671875, -2.132415771484375, -2.04150390625, -1.950592041015625, -1.85968017578125, -1.768768310546875, -1.6778564453125, -1.586944580078125, -1.49603271484375, -1.405120849609375, -1.314208984375, -1.223297119140625, -1.13238525390625, -1.041473388671875, -0.9505615234375, -0.859649658203125, -0.76873779296875, -0.677825927734375, -0.5869140625, -0.496002197265625, -0.40509033203125, -0.314178466796875, -0.2232666015625, -0.132354736328125, -0.04144287109375, 0.049468994140625, 0.140380859375, 0.231292724609375, 0.32220458984375, 0.413116455078125, 0.5040283203125, 0.594940185546875, 0.68585205078125, 0.776763916015625, 0.86767578125, 0.958587646484375, 1.04949951171875, 1.140411376953125, 1.2313232421875, 1.322235107421875, 1.41314697265625, 1.504058837890625, 1.594970703125, 1.685882568359375, 1.77679443359375, 1.867706298828125, 1.9586181640625, 2.049530029296875, 2.14044189453125, 2.231353759765625, 2.322265625]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 8.0, 5.0, 9.0, 7.0, 10.0, 11.0, 15.0, 20.0, 39.0, 37.0, 49.0, 48.0, 99.0, 146.0, 224.0, 430.0, 1077.0, 812.0, 327.0, 203.0, 136.0, 86.0, 63.0, 58.0, 40.0, 31.0, 21.0, 20.0, 12.0, 7.0, 7.0, 2.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.423583984375, -0.4083671569824219, -0.39315032958984375, -0.3779335021972656, -0.3627166748046875, -0.3474998474121094, -0.33228302001953125, -0.3170661926269531, -0.301849365234375, -0.2866325378417969, -0.27141571044921875, -0.2561988830566406, -0.2409820556640625, -0.22576522827148438, -0.21054840087890625, -0.19533157348632812, -0.18011474609375, -0.16489791870117188, -0.14968109130859375, -0.13446426391601562, -0.1192474365234375, -0.10403060913085938, -0.08881378173828125, -0.07359695434570312, -0.058380126953125, -0.043163299560546875, -0.02794647216796875, -0.012729644775390625, 0.0024871826171875, 0.017704010009765625, 0.03292083740234375, 0.048137664794921875, 0.0633544921875, 0.07857131958007812, 0.09378814697265625, 0.10900497436523438, 0.1242218017578125, 0.13943862915039062, 0.15465545654296875, 0.16987228393554688, 0.185089111328125, 0.20030593872070312, 0.21552276611328125, 0.23073959350585938, 0.2459564208984375, 0.2611732482910156, 0.27639007568359375, 0.2916069030761719, 0.30682373046875, 0.3220405578613281, 0.33725738525390625, 0.3524742126464844, 0.3676910400390625, 0.3829078674316406, 0.39812469482421875, 0.4133415222167969, 0.428558349609375, 0.4437751770019531, 0.45899200439453125, 0.4742088317871094, 0.4894256591796875, 0.5046424865722656, 0.5198593139648438, 0.5350761413574219, 0.55029296875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 4.0, 6.0, 10.0, 23.0, 35.0, 60.0, 100.0, 179.0, 203.0, 160.0, 78.0, 44.0, 37.0, 21.0, 9.0, 9.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.802375793457031, -4.683100700378418, -4.563825607299805, -4.444550514221191, -4.325275421142578, -4.206000328063965, -4.086725234985352, -3.9674503803253174, -3.848175287246704, -3.728900194168091, -3.6096251010894775, -3.4903500080108643, -3.37107515335083, -3.251800060272217, -3.1325249671936035, -3.0132498741149902, -2.893974781036377, -2.7746996879577637, -2.6554245948791504, -2.536149501800537, -2.416874408721924, -2.2975993156433105, -2.1783244609832764, -2.059049367904663, -1.9397742748260498, -1.8204991817474365, -1.7012240886688232, -1.5819491147994995, -1.4626740217208862, -1.343398928642273, -1.2241239547729492, -1.104848861694336, -0.9855737686157227, -0.8662986755371094, -0.7470236420631409, -0.6277486085891724, -0.5084735155105591, -0.3891984224319458, -0.2699233889579773, -0.1506483554840088, -0.03137326240539551, 0.08790180087089539, 0.20717686414718628, 0.3264519274234772, 0.44572699069976807, 0.5650020837783813, 0.6842771172523499, 0.8035521507263184, 0.9228272438049316, 1.042102336883545, 1.1613774299621582, 1.280652403831482, 1.3999274969100952, 1.5192025899887085, 1.6384775638580322, 1.7577526569366455, 1.8770277500152588, 1.996302843093872, 2.1155779361724854, 2.2348530292510986, 2.354127883911133, 2.473402976989746, 2.5926780700683594, 2.7119531631469727, 2.831228256225586]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 6.0, 8.0, 0.0, 4.0, 6.0, 10.0, 19.0, 19.0, 45.0, 60.0, 56.0, 69.0, 69.0, 69.0, 74.0, 59.0, 80.0, 68.0, 57.0, 45.0, 46.0, 32.0, 29.0, 20.0, 7.0, 6.0, 9.0, 10.0, 9.0, 6.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9878116846084595, -1.927910327911377, -1.8680088520050049, -1.8081074953079224, -1.7482061386108398, -1.6883046627044678, -1.6284033060073853, -1.5685019493103027, -1.5086004734039307, -1.4486991167068481, -1.388797640800476, -1.3288962841033936, -1.268994927406311, -1.2090935707092285, -1.1491920948028564, -1.089290738105774, -1.0293893814086914, -0.9694879651069641, -0.9095866084098816, -0.8496851921081543, -0.7897838354110718, -0.7298824191093445, -0.6699810028076172, -0.6100796461105347, -0.5501782298088074, -0.49027684330940247, -0.43037545680999756, -0.37047404050827026, -0.31057265400886536, -0.25067126750946045, -0.19076985120773315, -0.13086846470832825, -0.07096707820892334, -0.011065684258937836, 0.04883570969104767, 0.10873711109161377, 0.16863849759101868, 0.22853988409042358, 0.2884413003921509, 0.3483426868915558, 0.4082440733909607, 0.4681454598903656, 0.5280468463897705, 0.5879482626914978, 0.6478496789932251, 0.7077510356903076, 0.7676524519920349, 0.8275538682937622, 0.8874552249908447, 0.947356641292572, 1.0072580575942993, 1.0671594142913818, 1.1270607709884644, 1.1869621276855469, 1.246863603591919, 1.3067649602890015, 1.366666316986084, 1.4265676736831665, 1.4864691495895386, 1.546370506286621, 1.6062718629837036, 1.6661732196807861, 1.7260746955871582, 1.7859760522842407, 1.8458775281906128]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 8.0, 5.0, 12.0, 15.0, 21.0, 32.0, 58.0, 98.0, 181.0, 445.0, 1439.0, 6920.0, 78679.0, 895936.0, 56748.0, 5904.0, 1189.0, 426.0, 167.0, 109.0, 46.0, 36.0, 18.0, 13.0, 13.0, 8.0, 7.0, 1.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.410888671875, -0.3996162414550781, -0.38834381103515625, -0.3770713806152344, -0.3657989501953125, -0.3545265197753906, -0.34325408935546875, -0.3319816589355469, -0.320709228515625, -0.3094367980957031, -0.29816436767578125, -0.2868919372558594, -0.2756195068359375, -0.2643470764160156, -0.25307464599609375, -0.24180221557617188, -0.23052978515625, -0.21925735473632812, -0.20798492431640625, -0.19671249389648438, -0.1854400634765625, -0.17416763305664062, -0.16289520263671875, -0.15162277221679688, -0.140350341796875, -0.12907791137695312, -0.11780548095703125, -0.10653305053710938, -0.0952606201171875, -0.08398818969726562, -0.07271575927734375, -0.061443328857421875, -0.0501708984375, -0.038898468017578125, -0.02762603759765625, -0.016353607177734375, -0.0050811767578125, 0.006191253662109375, 0.01746368408203125, 0.028736114501953125, 0.040008544921875, 0.051280975341796875, 0.06255340576171875, 0.07382583618164062, 0.0850982666015625, 0.09637069702148438, 0.10764312744140625, 0.11891555786132812, 0.13018798828125, 0.14146041870117188, 0.15273284912109375, 0.16400527954101562, 0.1752777099609375, 0.18655014038085938, 0.19782257080078125, 0.20909500122070312, 0.220367431640625, 0.23163986206054688, 0.24291229248046875, 0.2541847229003906, 0.2654571533203125, 0.2767295837402344, 0.28800201416015625, 0.2992744445800781, 0.310546875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 3.0, 4.0, 9.0, 3.0, 7.0, 7.0, 11.0, 15.0, 26.0, 35.0, 56.0, 78.0, 83.0, 78.0, 88.0, 80.0, 77.0, 80.0, 62.0, 43.0, 46.0, 29.0, 21.0, 14.0, 10.0, 5.0, 9.0, 5.0, 4.0, 2.0, 9.0, 4.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7041015625, -1.6570587158203125, -1.610015869140625, -1.5629730224609375, -1.51593017578125, -1.4688873291015625, -1.421844482421875, -1.3748016357421875, -1.3277587890625, -1.2807159423828125, -1.233673095703125, -1.1866302490234375, -1.13958740234375, -1.0925445556640625, -1.045501708984375, -0.9984588623046875, -0.951416015625, -0.9043731689453125, -0.857330322265625, -0.8102874755859375, -0.76324462890625, -0.7162017822265625, -0.669158935546875, -0.6221160888671875, -0.5750732421875, -0.5280303955078125, -0.480987548828125, -0.4339447021484375, -0.38690185546875, -0.3398590087890625, -0.292816162109375, -0.2457733154296875, -0.19873046875, -0.1516876220703125, -0.104644775390625, -0.0576019287109375, -0.01055908203125, 0.0364837646484375, 0.083526611328125, 0.1305694580078125, 0.1776123046875, 0.2246551513671875, 0.271697998046875, 0.3187408447265625, 0.36578369140625, 0.4128265380859375, 0.459869384765625, 0.5069122314453125, 0.553955078125, 0.6009979248046875, 0.648040771484375, 0.6950836181640625, 0.74212646484375, 0.7891693115234375, 0.836212158203125, 0.8832550048828125, 0.9302978515625, 0.9773406982421875, 1.024383544921875, 1.0714263916015625, 1.11846923828125, 1.1655120849609375, 1.212554931640625, 1.2595977783203125, 1.306640625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 4.0, 3.0, 5.0, 11.0, 16.0, 16.0, 25.0, 27.0, 50.0, 73.0, 82.0, 142.0, 224.0, 497.0, 2162.0, 19292.0, 493801.0, 508751.0, 20003.0, 2106.0, 549.0, 244.0, 140.0, 121.0, 59.0, 40.0, 33.0, 24.0, 15.0, 13.0, 9.0, 6.0, 7.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.228759765625, -0.22161102294921875, -0.2144622802734375, -0.20731353759765625, -0.200164794921875, -0.19301605224609375, -0.1858673095703125, -0.17871856689453125, -0.17156982421875, -0.16442108154296875, -0.1572723388671875, -0.15012359619140625, -0.142974853515625, -0.13582611083984375, -0.1286773681640625, -0.12152862548828125, -0.1143798828125, -0.10723114013671875, -0.1000823974609375, -0.09293365478515625, -0.085784912109375, -0.07863616943359375, -0.0714874267578125, -0.06433868408203125, -0.05718994140625, -0.05004119873046875, -0.0428924560546875, -0.03574371337890625, -0.028594970703125, -0.02144622802734375, -0.0142974853515625, -0.00714874267578125, 0.0, 0.00714874267578125, 0.0142974853515625, 0.02144622802734375, 0.028594970703125, 0.03574371337890625, 0.0428924560546875, 0.05004119873046875, 0.05718994140625, 0.06433868408203125, 0.0714874267578125, 0.07863616943359375, 0.085784912109375, 0.09293365478515625, 0.1000823974609375, 0.10723114013671875, 0.1143798828125, 0.12152862548828125, 0.1286773681640625, 0.13582611083984375, 0.142974853515625, 0.15012359619140625, 0.1572723388671875, 0.16442108154296875, 0.17156982421875, 0.17871856689453125, 0.1858673095703125, 0.19301605224609375, 0.200164794921875, 0.20731353759765625, 0.2144622802734375, 0.22161102294921875, 0.228759765625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 5.0, 4.0, 7.0, 7.0, 6.0, 10.0, 15.0, 16.0, 15.0, 28.0, 24.0, 36.0, 46.0, 40.0, 40.0, 46.0, 58.0, 46.0, 49.0, 49.0, 61.0, 53.0, 50.0, 48.0, 37.0, 43.0, 36.0, 27.0, 25.0, 18.0, 12.0, 13.0, 13.0, 9.0, 0.0, 5.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.15234375, -2.0860595703125, -2.019775390625, -1.9534912109375, -1.88720703125, -1.8209228515625, -1.754638671875, -1.6883544921875, -1.6220703125, -1.5557861328125, -1.489501953125, -1.4232177734375, -1.35693359375, -1.2906494140625, -1.224365234375, -1.1580810546875, -1.091796875, -1.0255126953125, -0.959228515625, -0.8929443359375, -0.82666015625, -0.7603759765625, -0.694091796875, -0.6278076171875, -0.5615234375, -0.4952392578125, -0.428955078125, -0.3626708984375, -0.29638671875, -0.2301025390625, -0.163818359375, -0.0975341796875, -0.03125, 0.0350341796875, 0.101318359375, 0.1676025390625, 0.23388671875, 0.3001708984375, 0.366455078125, 0.4327392578125, 0.4990234375, 0.5653076171875, 0.631591796875, 0.6978759765625, 0.76416015625, 0.8304443359375, 0.896728515625, 0.9630126953125, 1.029296875, 1.0955810546875, 1.161865234375, 1.2281494140625, 1.29443359375, 1.3607177734375, 1.427001953125, 1.4932861328125, 1.5595703125, 1.6258544921875, 1.692138671875, 1.7584228515625, 1.82470703125, 1.8909912109375, 1.957275390625, 2.0235595703125, 2.08984375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 3.0, 0.0, 3.0, 7.0, 18.0, 10.0, 23.0, 19.0, 15.0, 29.0, 52.0, 80.0, 204.0, 513.0, 2135.0, 15680.0, 976186.0, 48584.0, 3644.0, 789.0, 252.0, 98.0, 57.0, 26.0, 26.0, 17.0, 17.0, 7.0, 9.0, 8.0, 8.0, 5.0, 7.0, 6.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0518798828125, -0.05006980895996094, -0.048259735107421875, -0.04644966125488281, -0.04463958740234375, -0.04282951354980469, -0.041019439697265625, -0.03920936584472656, -0.0373992919921875, -0.03558921813964844, -0.033779144287109375, -0.03196907043457031, -0.03015899658203125, -0.028348922729492188, -0.026538848876953125, -0.024728775024414062, -0.022918701171875, -0.021108627319335938, -0.019298553466796875, -0.017488479614257812, -0.01567840576171875, -0.013868331909179688, -0.012058258056640625, -0.010248184204101562, -0.0084381103515625, -0.0066280364990234375, -0.004817962646484375, -0.0030078887939453125, -0.00119781494140625, 0.0006122589111328125, 0.002422332763671875, 0.0042324066162109375, 0.00604248046875, 0.007852554321289062, 0.009662628173828125, 0.011472702026367188, 0.01328277587890625, 0.015092849731445312, 0.016902923583984375, 0.018712997436523438, 0.0205230712890625, 0.022333145141601562, 0.024143218994140625, 0.025953292846679688, 0.02776336669921875, 0.029573440551757812, 0.031383514404296875, 0.03319358825683594, 0.035003662109375, 0.03681373596191406, 0.038623809814453125, 0.04043388366699219, 0.04224395751953125, 0.04405403137207031, 0.045864105224609375, 0.04767417907714844, 0.0494842529296875, 0.05129432678222656, 0.053104400634765625, 0.05491447448730469, 0.05672454833984375, 0.05853462219238281, 0.060344696044921875, 0.06215476989746094, 0.06396484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 3.0, 1.0, 5.0, 2.0, 1.0, 4.0, 7.0, 9.0, 14.0, 12.0, 34.0, 47.0, 72.0, 92.0, 90.0, 137.0, 105.0, 112.0, 77.0, 61.0, 40.0, 23.0, 15.0, 12.0, 14.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6570091247558594e-05, -1.61072239279747e-05, -1.5644356608390808e-05, -1.5181489288806915e-05, -1.4718621969223022e-05, -1.425575464963913e-05, -1.3792887330055237e-05, -1.3330020010471344e-05, -1.2867152690887451e-05, -1.2404285371303558e-05, -1.1941418051719666e-05, -1.1478550732135773e-05, -1.101568341255188e-05, -1.0552816092967987e-05, -1.0089948773384094e-05, -9.627081453800201e-06, -9.164214134216309e-06, -8.701346814632416e-06, -8.238479495048523e-06, -7.77561217546463e-06, -7.312744855880737e-06, -6.8498775362968445e-06, -6.387010216712952e-06, -5.924142897129059e-06, -5.461275577545166e-06, -4.998408257961273e-06, -4.53554093837738e-06, -4.0726736187934875e-06, -3.6098062992095947e-06, -3.146938979625702e-06, -2.684071660041809e-06, -2.2212043404579163e-06, -1.7583370208740234e-06, -1.2954697012901306e-06, -8.326023817062378e-07, -3.6973506212234497e-07, 9.313225746154785e-08, 5.559995770454407e-07, 1.0188668966293335e-06, 1.4817342162132263e-06, 1.944601535797119e-06, 2.407468855381012e-06, 2.8703361749649048e-06, 3.3332034945487976e-06, 3.7960708141326904e-06, 4.258938133716583e-06, 4.721805453300476e-06, 5.184672772884369e-06, 5.647540092468262e-06, 6.1104074120521545e-06, 6.573274731636047e-06, 7.03614205121994e-06, 7.499009370803833e-06, 7.961876690387726e-06, 8.424744009971619e-06, 8.887611329555511e-06, 9.350478649139404e-06, 9.813345968723297e-06, 1.027621328830719e-05, 1.0739080607891083e-05, 1.1201947927474976e-05, 1.1664815247058868e-05, 1.2127682566642761e-05, 1.2590549886226654e-05, 1.3053417205810547e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 4.0, 12.0, 11.0, 10.0, 9.0, 15.0, 27.0, 45.0, 77.0, 91.0, 185.0, 382.0, 883.0, 3009.0, 20737.0, 988085.0, 29449.0, 3614.0, 1060.0, 381.0, 177.0, 92.0, 55.0, 39.0, 31.0, 21.0, 17.0, 6.0, 4.0, 8.0, 9.0, 5.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09918212890625, -0.09639263153076172, -0.09360313415527344, -0.09081363677978516, -0.08802413940429688, -0.0852346420288086, -0.08244514465332031, -0.07965564727783203, -0.07686614990234375, -0.07407665252685547, -0.07128715515136719, -0.0684976577758789, -0.06570816040039062, -0.06291866302490234, -0.06012916564941406, -0.05733966827392578, -0.0545501708984375, -0.05176067352294922, -0.04897117614746094, -0.046181678771972656, -0.043392181396484375, -0.040602684020996094, -0.03781318664550781, -0.03502368927001953, -0.03223419189453125, -0.02944469451904297, -0.026655197143554688, -0.023865699768066406, -0.021076202392578125, -0.018286705017089844, -0.015497207641601562, -0.012707710266113281, -0.009918212890625, -0.007128715515136719, -0.0043392181396484375, -0.0015497207641601562, 0.001239776611328125, 0.004029273986816406, 0.0068187713623046875, 0.009608268737792969, 0.01239776611328125, 0.015187263488769531, 0.017976760864257812, 0.020766258239746094, 0.023555755615234375, 0.026345252990722656, 0.029134750366210938, 0.03192424774169922, 0.0347137451171875, 0.03750324249267578, 0.04029273986816406, 0.043082237243652344, 0.045871734619140625, 0.048661231994628906, 0.05145072937011719, 0.05424022674560547, 0.05702972412109375, 0.05981922149658203, 0.06260871887207031, 0.0653982162475586, 0.06818771362304688, 0.07097721099853516, 0.07376670837402344, 0.07655620574951172, 0.079345703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 4.0, 7.0, 6.0, 15.0, 19.0, 28.0, 40.0, 38.0, 74.0, 85.0, 152.0, 169.0, 129.0, 58.0, 57.0, 31.0, 24.0, 12.0, 10.0, 7.0, 5.0, 6.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005611419677734375, -0.005447864532470703, -0.005284309387207031, -0.005120754241943359, -0.0049571990966796875, -0.004793643951416016, -0.004630088806152344, -0.004466533660888672, -0.004302978515625, -0.004139423370361328, -0.003975868225097656, -0.0038123130798339844, -0.0036487579345703125, -0.0034852027893066406, -0.0033216476440429688, -0.003158092498779297, -0.002994537353515625, -0.002830982208251953, -0.0026674270629882812, -0.0025038719177246094, -0.0023403167724609375, -0.0021767616271972656, -0.0020132064819335938, -0.0018496513366699219, -0.00168609619140625, -0.0015225410461425781, -0.0013589859008789062, -0.0011954307556152344, -0.0010318756103515625, -0.0008683204650878906, -0.0007047653198242188, -0.0005412101745605469, -0.000377655029296875, -0.00021409988403320312, -5.054473876953125e-05, 0.00011301040649414062, 0.0002765655517578125, 0.0004401206970214844, 0.0006036758422851562, 0.0007672309875488281, 0.0009307861328125, 0.0010943412780761719, 0.0012578964233398438, 0.0014214515686035156, 0.0015850067138671875, 0.0017485618591308594, 0.0019121170043945312, 0.002075672149658203, 0.002239227294921875, 0.002402782440185547, 0.0025663375854492188, 0.0027298927307128906, 0.0028934478759765625, 0.0030570030212402344, 0.0032205581665039062, 0.003384113311767578, 0.00354766845703125, 0.003711223602294922, 0.0038747787475585938, 0.004038333892822266, 0.0042018890380859375, 0.004365444183349609, 0.004528999328613281, 0.004692554473876953, 0.004856109619140625]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 5.0, 5.0, 9.0, 24.0, 45.0, 69.0, 164.0, 243.0, 199.0, 102.0, 52.0, 33.0, 17.0, 7.0, 8.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.527554512023926, -3.431450366973877, -3.335345983505249, -3.2392418384552, -3.1431376934051514, -3.0470335483551025, -2.9509291648864746, -2.854825019836426, -2.758720874786377, -2.662616729736328, -2.5665123462677, -2.4704082012176514, -2.3743040561676025, -2.2781999111175537, -2.182095527648926, -2.085991382598877, -1.9898871183395386, -1.8937828540802002, -1.7976787090301514, -1.701574444770813, -1.6054702997207642, -1.5093660354614258, -1.413261890411377, -1.3171576261520386, -1.2210533618927002, -1.1249490976333618, -1.028844952583313, -0.9327406883239746, -0.8366365432739258, -0.7405322790145874, -0.6444280743598938, -0.5483238697052002, -0.45221972465515137, -0.35611552000045776, -0.26001131534576416, -0.16390708088874817, -0.06780287623405457, 0.028301328420639038, 0.12440556287765503, 0.22050976753234863, 0.31661397218704224, 0.41271817684173584, 0.5088223814964294, 0.604926586151123, 0.7010308504104614, 0.7971349954605103, 0.8932392597198486, 0.9893434643745422, 1.0854476690292358, 1.1815519332885742, 1.277656078338623, 1.3737603425979614, 1.4698644876480103, 1.5659687519073486, 1.6620728969573975, 1.7581771612167358, 1.8542814254760742, 1.9503856897354126, 2.046489953994751, 2.1425940990448, 2.2386982440948486, 2.3348023891448975, 2.4309067726135254, 2.527010917663574, 2.623115062713623]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 4.0, 9.0, 11.0, 24.0, 35.0, 47.0, 65.0, 76.0, 87.0, 80.0, 79.0, 89.0, 76.0, 71.0, 66.0, 42.0, 36.0, 25.0, 12.0, 10.0, 7.0, 8.0, 8.0, 4.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6748292446136475, -1.627956748008728, -1.581084132194519, -1.5342116355895996, -1.4873391389846802, -1.4404665231704712, -1.3935940265655518, -1.3467214107513428, -1.2998489141464233, -1.252976417541504, -1.206103801727295, -1.1592313051223755, -1.112358808517456, -1.065486192703247, -1.0186136960983276, -0.9717411398887634, -0.924868643283844, -0.8779960870742798, -0.8311235904693604, -0.7842510342597961, -0.7373784780502319, -0.6905059814453125, -0.6436334252357483, -0.5967608690261841, -0.5498883724212646, -0.5030158162117004, -0.4561432898044586, -0.4092707633972168, -0.3623982071876526, -0.31552568078041077, -0.26865315437316895, -0.22178059816360474, -0.17490804195404053, -0.1280355006456375, -0.0811629667878151, -0.034290432929992676, 0.01258210837841034, 0.059454649686813354, 0.10632717609405518, 0.15319973230361938, 0.2000722587108612, 0.24694480001926422, 0.29381734132766724, 0.34068986773490906, 0.3875623941421509, 0.4344349503517151, 0.4813074767589569, 0.5281800031661987, 0.5750525593757629, 0.6219251155853271, 0.6687976121902466, 0.7156701683998108, 0.762542724609375, 0.8094152212142944, 0.8562877774238586, 0.9031603336334229, 0.9500328302383423, 0.9969053864479065, 1.0437779426574707, 1.0906504392623901, 1.1375229358673096, 1.1843955516815186, 1.231268048286438, 1.2781405448913574, 1.3250131607055664]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 10.0, 7.0, 15.0, 26.0, 32.0, 55.0, 94.0, 135.0, 227.0, 442.0, 655.0, 1155.0, 2161.0, 4309.0, 9227.0, 23410.0, 72768.0, 407207.0, 411381.0, 73070.0, 23414.0, 9344.0, 4332.0, 2132.0, 1210.0, 703.0, 400.0, 249.0, 144.0, 88.0, 56.0, 36.0, 17.0, 16.0, 12.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82958984375, -0.7964096069335938, -0.7632293701171875, -0.7300491333007812, -0.696868896484375, -0.6636886596679688, -0.6305084228515625, -0.5973281860351562, -0.56414794921875, -0.5309677124023438, -0.4977874755859375, -0.46460723876953125, -0.431427001953125, -0.39824676513671875, -0.3650665283203125, -0.33188629150390625, -0.2987060546875, -0.26552581787109375, -0.2323455810546875, -0.19916534423828125, -0.165985107421875, -0.13280487060546875, -0.0996246337890625, -0.06644439697265625, -0.03326416015625, -8.392333984375e-05, 0.0330963134765625, 0.06627655029296875, 0.099456787109375, 0.13263702392578125, 0.1658172607421875, 0.19899749755859375, 0.232177734375, 0.26535797119140625, 0.2985382080078125, 0.33171844482421875, 0.364898681640625, 0.39807891845703125, 0.4312591552734375, 0.46443939208984375, 0.49761962890625, 0.5307998657226562, 0.5639801025390625, 0.5971603393554688, 0.630340576171875, 0.6635208129882812, 0.6967010498046875, 0.7298812866210938, 0.7630615234375, 0.7962417602539062, 0.8294219970703125, 0.8626022338867188, 0.895782470703125, 0.9289627075195312, 0.9621429443359375, 0.9953231811523438, 1.02850341796875, 1.0616836547851562, 1.0948638916015625, 1.1280441284179688, 1.161224365234375, 1.1944046020507812, 1.2275848388671875, 1.2607650756835938, 1.2939453125]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 7.0, 7.0, 8.0, 9.0, 31.0, 27.0, 31.0, 62.0, 67.0, 78.0, 79.0, 82.0, 85.0, 78.0, 61.0, 73.0, 50.0, 38.0, 31.0, 12.0, 14.0, 7.0, 12.0, 11.0, 10.0, 6.0, 4.0, 4.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.91015625, -2.819305419921875, -2.72845458984375, -2.637603759765625, -2.5467529296875, -2.455902099609375, -2.36505126953125, -2.274200439453125, -2.183349609375, -2.092498779296875, -2.00164794921875, -1.910797119140625, -1.8199462890625, -1.729095458984375, -1.63824462890625, -1.547393798828125, -1.45654296875, -1.365692138671875, -1.27484130859375, -1.183990478515625, -1.0931396484375, -1.002288818359375, -0.91143798828125, -0.820587158203125, -0.729736328125, -0.638885498046875, -0.54803466796875, -0.457183837890625, -0.3663330078125, -0.275482177734375, -0.18463134765625, -0.093780517578125, -0.0029296875, 0.087921142578125, 0.17877197265625, 0.269622802734375, 0.3604736328125, 0.451324462890625, 0.54217529296875, 0.633026123046875, 0.723876953125, 0.814727783203125, 0.90557861328125, 0.996429443359375, 1.0872802734375, 1.178131103515625, 1.26898193359375, 1.359832763671875, 1.45068359375, 1.541534423828125, 1.63238525390625, 1.723236083984375, 1.8140869140625, 1.904937744140625, 1.99578857421875, 2.086639404296875, 2.177490234375, 2.268341064453125, 2.35919189453125, 2.450042724609375, 2.5408935546875, 2.631744384765625, 2.72259521484375, 2.813446044921875, 2.904296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 2.0, 5.0, 4.0, 2.0, 4.0, 7.0, 12.0, 21.0, 23.0, 40.0, 46.0, 91.0, 114.0, 191.0, 301.0, 570.0, 1117.0, 2716.0, 7586.0, 27192.0, 144858.0, 706525.0, 121590.0, 23683.0, 6800.0, 2508.0, 1089.0, 553.0, 317.0, 169.0, 119.0, 85.0, 69.0, 50.0, 25.0, 15.0, 16.0, 9.0, 10.0, 3.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.029296875, -0.9954986572265625, -0.961700439453125, -0.9279022216796875, -0.89410400390625, -0.8603057861328125, -0.826507568359375, -0.7927093505859375, -0.7589111328125, -0.7251129150390625, -0.691314697265625, -0.6575164794921875, -0.62371826171875, -0.5899200439453125, -0.556121826171875, -0.5223236083984375, -0.488525390625, -0.4547271728515625, -0.420928955078125, -0.3871307373046875, -0.35333251953125, -0.3195343017578125, -0.285736083984375, -0.2519378662109375, -0.2181396484375, -0.1843414306640625, -0.150543212890625, -0.1167449951171875, -0.08294677734375, -0.0491485595703125, -0.015350341796875, 0.0184478759765625, 0.05224609375, 0.0860443115234375, 0.119842529296875, 0.1536407470703125, 0.18743896484375, 0.2212371826171875, 0.255035400390625, 0.2888336181640625, 0.3226318359375, 0.3564300537109375, 0.390228271484375, 0.4240264892578125, 0.45782470703125, 0.4916229248046875, 0.525421142578125, 0.5592193603515625, 0.593017578125, 0.6268157958984375, 0.660614013671875, 0.6944122314453125, 0.72821044921875, 0.7620086669921875, 0.795806884765625, 0.8296051025390625, 0.8634033203125, 0.8972015380859375, 0.930999755859375, 0.9647979736328125, 0.99859619140625, 1.0323944091796875, 1.066192626953125, 1.0999908447265625, 1.1337890625]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 4.0, 6.0, 3.0, 13.0, 9.0, 16.0, 19.0, 17.0, 25.0, 15.0, 28.0, 26.0, 33.0, 39.0, 44.0, 28.0, 34.0, 49.0, 40.0, 45.0, 42.0, 46.0, 37.0, 41.0, 39.0, 40.0, 31.0, 37.0, 32.0, 30.0, 19.0, 16.0, 17.0, 17.0, 11.0, 10.0, 13.0, 10.0, 11.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9287109375, -1.8623504638671875, -1.795989990234375, -1.7296295166015625, -1.66326904296875, -1.5969085693359375, -1.530548095703125, -1.4641876220703125, -1.3978271484375, -1.3314666748046875, -1.265106201171875, -1.1987457275390625, -1.13238525390625, -1.0660247802734375, -0.999664306640625, -0.9333038330078125, -0.866943359375, -0.8005828857421875, -0.734222412109375, -0.6678619384765625, -0.60150146484375, -0.5351409912109375, -0.468780517578125, -0.4024200439453125, -0.3360595703125, -0.2696990966796875, -0.203338623046875, -0.1369781494140625, -0.07061767578125, -0.0042572021484375, 0.062103271484375, 0.1284637451171875, 0.19482421875, 0.2611846923828125, 0.327545166015625, 0.3939056396484375, 0.46026611328125, 0.5266265869140625, 0.592987060546875, 0.6593475341796875, 0.7257080078125, 0.7920684814453125, 0.858428955078125, 0.9247894287109375, 0.99114990234375, 1.0575103759765625, 1.123870849609375, 1.1902313232421875, 1.256591796875, 1.3229522705078125, 1.389312744140625, 1.4556732177734375, 1.52203369140625, 1.5883941650390625, 1.654754638671875, 1.7211151123046875, 1.7874755859375, 1.8538360595703125, 1.920196533203125, 1.9865570068359375, 2.05291748046875, 2.1192779541015625, 2.185638427734375, 2.2519989013671875, 2.318359375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 4.0, 8.0, 8.0, 11.0, 19.0, 32.0, 21.0, 43.0, 60.0, 91.0, 124.0, 196.0, 262.0, 434.0, 728.0, 1398.0, 2686.0, 6130.0, 16240.0, 56242.0, 319994.0, 540527.0, 70147.0, 19443.0, 7013.0, 3057.0, 1480.0, 791.0, 480.0, 308.0, 186.0, 129.0, 78.0, 59.0, 30.0, 19.0, 13.0, 13.0, 12.0, 7.0, 9.0, 7.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.41943359375, -0.4063568115234375, -0.393280029296875, -0.3802032470703125, -0.36712646484375, -0.3540496826171875, -0.340972900390625, -0.3278961181640625, -0.3148193359375, -0.3017425537109375, -0.288665771484375, -0.2755889892578125, -0.26251220703125, -0.2494354248046875, -0.236358642578125, -0.2232818603515625, -0.210205078125, -0.1971282958984375, -0.184051513671875, -0.1709747314453125, -0.15789794921875, -0.1448211669921875, -0.131744384765625, -0.1186676025390625, -0.1055908203125, -0.0925140380859375, -0.079437255859375, -0.0663604736328125, -0.05328369140625, -0.0402069091796875, -0.027130126953125, -0.0140533447265625, -0.0009765625, 0.0121002197265625, 0.025177001953125, 0.0382537841796875, 0.05133056640625, 0.0644073486328125, 0.077484130859375, 0.0905609130859375, 0.1036376953125, 0.1167144775390625, 0.129791259765625, 0.1428680419921875, 0.15594482421875, 0.1690216064453125, 0.182098388671875, 0.1951751708984375, 0.208251953125, 0.2213287353515625, 0.234405517578125, 0.2474822998046875, 0.26055908203125, 0.2736358642578125, 0.286712646484375, 0.2997894287109375, 0.3128662109375, 0.3259429931640625, 0.339019775390625, 0.3520965576171875, 0.36517333984375, 0.3782501220703125, 0.391326904296875, 0.4044036865234375, 0.41748046875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 5.0, 4.0, 16.0, 6.0, 13.0, 19.0, 26.0, 25.0, 42.0, 79.0, 102.0, 227.0, 124.0, 84.0, 61.0, 44.0, 38.0, 18.0, 17.0, 10.0, 4.0, 5.0, 8.0, 6.0, 1.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5367431640625e-05, -9.245332330465317e-05, -8.953921496868134e-05, -8.66251066327095e-05, -8.371099829673767e-05, -8.079688996076584e-05, -7.7882781624794e-05, -7.496867328882217e-05, -7.205456495285034e-05, -6.914045661687851e-05, -6.622634828090668e-05, -6.331223994493484e-05, -6.039813160896301e-05, -5.748402327299118e-05, -5.456991493701935e-05, -5.1655806601047516e-05, -4.8741698265075684e-05, -4.582758992910385e-05, -4.291348159313202e-05, -3.999937325716019e-05, -3.7085264921188354e-05, -3.417115658521652e-05, -3.125704824924469e-05, -2.8342939913272858e-05, -2.5428831577301025e-05, -2.2514723241329193e-05, -1.960061490535736e-05, -1.668650656938553e-05, -1.3772398233413696e-05, -1.0858289897441864e-05, -7.944181561470032e-06, -5.0300732254981995e-06, -2.115964889526367e-06, 7.981434464454651e-07, 3.7122517824172974e-06, 6.62636011838913e-06, 9.540468454360962e-06, 1.2454576790332794e-05, 1.5368685126304626e-05, 1.828279346227646e-05, 2.119690179824829e-05, 2.4111010134220123e-05, 2.7025118470191956e-05, 2.9939226806163788e-05, 3.285333514213562e-05, 3.576744347810745e-05, 3.8681551814079285e-05, 4.159566015005112e-05, 4.450976848602295e-05, 4.742387682199478e-05, 5.0337985157966614e-05, 5.3252093493938446e-05, 5.616620182991028e-05, 5.908031016588211e-05, 6.199441850185394e-05, 6.490852683782578e-05, 6.782263517379761e-05, 7.073674350976944e-05, 7.365085184574127e-05, 7.65649601817131e-05, 7.947906851768494e-05, 8.239317685365677e-05, 8.53072851896286e-05, 8.822139352560043e-05, 9.113550186157227e-05]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 6.0, 0.0, 2.0, 2.0, 7.0, 9.0, 10.0, 13.0, 27.0, 30.0, 48.0, 74.0, 107.0, 192.0, 339.0, 598.0, 1184.0, 2562.0, 6246.0, 16551.0, 56927.0, 368911.0, 502095.0, 62860.0, 17857.0, 6456.0, 2768.0, 1220.0, 642.0, 311.0, 187.0, 124.0, 70.0, 47.0, 29.0, 18.0, 10.0, 9.0, 7.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.457763671875, -0.4430122375488281, -0.42826080322265625, -0.4135093688964844, -0.3987579345703125, -0.3840065002441406, -0.36925506591796875, -0.3545036315917969, -0.339752197265625, -0.3250007629394531, -0.31024932861328125, -0.2954978942871094, -0.2807464599609375, -0.2659950256347656, -0.25124359130859375, -0.23649215698242188, -0.22174072265625, -0.20698928833007812, -0.19223785400390625, -0.17748641967773438, -0.1627349853515625, -0.14798355102539062, -0.13323211669921875, -0.11848068237304688, -0.103729248046875, -0.08897781372070312, -0.07422637939453125, -0.059474945068359375, -0.0447235107421875, -0.029972076416015625, -0.01522064208984375, -0.000469207763671875, 0.0142822265625, 0.029033660888671875, 0.04378509521484375, 0.058536529541015625, 0.0732879638671875, 0.08803939819335938, 0.10279083251953125, 0.11754226684570312, 0.132293701171875, 0.14704513549804688, 0.16179656982421875, 0.17654800415039062, 0.1912994384765625, 0.20605087280273438, 0.22080230712890625, 0.23555374145507812, 0.25030517578125, 0.2650566101074219, 0.27980804443359375, 0.2945594787597656, 0.3093109130859375, 0.3240623474121094, 0.33881378173828125, 0.3535652160644531, 0.368316650390625, 0.3830680847167969, 0.39781951904296875, 0.4125709533691406, 0.4273223876953125, 0.4420738220214844, 0.45682525634765625, 0.4715766906738281, 0.486328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 8.0, 4.0, 3.0, 3.0, 15.0, 9.0, 6.0, 20.0, 23.0, 36.0, 29.0, 44.0, 53.0, 85.0, 227.0, 132.0, 63.0, 61.0, 37.0, 26.0, 15.0, 18.0, 20.0, 9.0, 11.0, 11.0, 16.0, 1.0, 5.0, 2.0, 3.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.176025390625, -0.16891098022460938, -0.16179656982421875, -0.15468215942382812, -0.1475677490234375, -0.14045333862304688, -0.13333892822265625, -0.12622451782226562, -0.119110107421875, -0.11199569702148438, -0.10488128662109375, -0.09776687622070312, -0.0906524658203125, -0.08353805541992188, -0.07642364501953125, -0.06930923461914062, -0.06219482421875, -0.055080413818359375, -0.04796600341796875, -0.040851593017578125, -0.0337371826171875, -0.026622772216796875, -0.01950836181640625, -0.012393951416015625, -0.005279541015625, 0.001834869384765625, 0.00894927978515625, 0.016063690185546875, 0.0231781005859375, 0.030292510986328125, 0.03740692138671875, 0.044521331787109375, 0.0516357421875, 0.058750152587890625, 0.06586456298828125, 0.07297897338867188, 0.0800933837890625, 0.08720779418945312, 0.09432220458984375, 0.10143661499023438, 0.108551025390625, 0.11566543579101562, 0.12277984619140625, 0.12989425659179688, 0.1370086669921875, 0.14412307739257812, 0.15123748779296875, 0.15835189819335938, 0.16546630859375, 0.17258071899414062, 0.17969512939453125, 0.18680953979492188, 0.1939239501953125, 0.20103836059570312, 0.20815277099609375, 0.21526718139648438, 0.222381591796875, 0.22949600219726562, 0.23661041259765625, 0.24372482299804688, 0.2508392333984375, 0.2579536437988281, 0.26506805419921875, 0.2721824645996094, 0.279296875]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 3.0, 12.0, 16.0, 63.0, 248.0, 425.0, 173.0, 35.0, 15.0, 8.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.661322593688965, -5.2662577629089355, -4.871192932128906, -4.476128578186035, -4.081063747406006, -3.6859989166259766, -3.2909343242645264, -2.895869731903076, -2.500804901123047, -2.1057400703430176, -1.7106754779815674, -1.3156107664108276, -0.9205460548400879, -0.5254813432693481, -0.1304166316986084, 0.2646479606628418, 0.6597127914428711, 1.0547775030136108, 1.4498422145843506, 1.8449069261550903, 2.23997163772583, 2.6350364685058594, 3.0301010608673096, 3.4251656532287598, 3.820230484008789, 4.215295314788818, 4.610360145568848, 5.005424499511719, 5.400489330291748, 5.795554161071777, 6.190618515014648, 6.585683345794678, 6.980749130249023, 7.375813961029053, 7.770878791809082, 8.165943145751953, 8.56100845336914, 8.956072807312012, 9.351137161254883, 9.74620246887207, 10.141266822814941, 10.536331176757812, 10.931396484375, 11.326460838317871, 11.721525192260742, 12.11659049987793, 12.5116548538208, 12.906719207763672, 13.30178451538086, 13.69684886932373, 14.091914176940918, 14.486978530883789, 14.882043838500977, 15.277108192443848, 15.672172546386719, 16.067237854003906, 16.462303161621094, 16.85736846923828, 17.252431869506836, 17.647497177124023, 18.04256248474121, 18.437625885009766, 18.832691192626953, 19.22775650024414, 19.622819900512695]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 12.0, 6.0, 7.0, 11.0, 24.0, 24.0, 24.0, 43.0, 27.0, 28.0, 29.0, 43.0, 44.0, 32.0, 41.0, 50.0, 55.0, 43.0, 46.0, 35.0, 39.0, 45.0, 37.0, 31.0, 31.0, 34.0, 32.0, 27.0, 14.0, 12.0, 13.0, 5.0, 6.0, 10.0, 5.0, 1.0, 5.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.297745227813721, -4.167235851287842, -4.036726474761963, -3.906216859817505, -3.775707483291626, -3.645198106765747, -3.514688491821289, -3.38417911529541, -3.2536697387695312, -3.1231603622436523, -2.9926509857177734, -2.8621413707733154, -2.7316319942474365, -2.6011226177215576, -2.4706130027770996, -2.3401036262512207, -2.209594249725342, -2.079084873199463, -1.9485753774642944, -1.818065881729126, -1.687556505203247, -1.5570471286773682, -1.4265376329421997, -1.2960281372070312, -1.1655187606811523, -1.0350093841552734, -0.904499888420105, -0.7739904522895813, -0.6434810161590576, -0.5129715800285339, -0.38246214389801025, -0.2519527077674866, -0.12144327163696289, 0.009066164493560791, 0.13957560062408447, 0.27008503675460815, 0.40059447288513184, 0.5311039090156555, 0.6616133451461792, 0.7921227812767029, 0.9226322174072266, 1.0531415939331055, 1.183651089668274, 1.3141605854034424, 1.4446699619293213, 1.5751793384552002, 1.7056888341903687, 1.836198329925537, 1.966707706451416, 2.097217082977295, 2.227726459503174, 2.358236074447632, 2.4887454509735107, 2.6192548274993896, 2.7497644424438477, 2.8802738189697266, 3.0107831954956055, 3.1412925720214844, 3.2718019485473633, 3.4023115634918213, 3.5328209400177, 3.663330316543579, 3.793839931488037, 3.924349308013916, 4.054858684539795]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 3.0, 8.0, 19.0, 21.0, 29.0, 35.0, 46.0, 99.0, 132.0, 209.0, 287.0, 626.0, 1182.0, 2502.0, 6461.0, 20827.0, 104570.0, 2887530.0, 1073009.0, 70409.0, 16152.0, 5467.0, 2235.0, 1039.0, 541.0, 314.0, 178.0, 129.0, 71.0, 51.0, 34.0, 24.0, 16.0, 6.0, 5.0, 6.0, 2.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.865234375, -1.798370361328125, -1.73150634765625, -1.664642333984375, -1.5977783203125, -1.530914306640625, -1.46405029296875, -1.397186279296875, -1.330322265625, -1.263458251953125, -1.19659423828125, -1.129730224609375, -1.0628662109375, -0.996002197265625, -0.92913818359375, -0.862274169921875, -0.79541015625, -0.728546142578125, -0.66168212890625, -0.594818115234375, -0.5279541015625, -0.461090087890625, -0.39422607421875, -0.327362060546875, -0.260498046875, -0.193634033203125, -0.12677001953125, -0.059906005859375, 0.0069580078125, 0.073822021484375, 0.14068603515625, 0.207550048828125, 0.2744140625, 0.341278076171875, 0.40814208984375, 0.475006103515625, 0.5418701171875, 0.608734130859375, 0.67559814453125, 0.742462158203125, 0.809326171875, 0.876190185546875, 0.94305419921875, 1.009918212890625, 1.0767822265625, 1.143646240234375, 1.21051025390625, 1.277374267578125, 1.34423828125, 1.411102294921875, 1.47796630859375, 1.544830322265625, 1.6116943359375, 1.678558349609375, 1.74542236328125, 1.812286376953125, 1.879150390625, 1.946014404296875, 2.01287841796875, 2.079742431640625, 2.1466064453125, 2.213470458984375, 2.28033447265625, 2.347198486328125, 2.4140625]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 6.0, 7.0, 7.0, 9.0, 19.0, 32.0, 24.0, 43.0, 69.0, 80.0, 103.0, 108.0, 102.0, 76.0, 89.0, 49.0, 52.0, 33.0, 28.0, 8.0, 8.0, 8.0, 7.0, 4.0, 4.0, 9.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.216796875, -2.16015625, -2.103515625, -2.046875, -1.990234375, -1.93359375, -1.876953125, -1.8203125, -1.763671875, -1.70703125, -1.650390625, -1.59375, -1.537109375, -1.48046875, -1.423828125, -1.3671875, -1.310546875, -1.25390625, -1.197265625, -1.140625, -1.083984375, -1.02734375, -0.970703125, -0.9140625, -0.857421875, -0.80078125, -0.744140625, -0.6875, -0.630859375, -0.57421875, -0.517578125, -0.4609375, -0.404296875, -0.34765625, -0.291015625, -0.234375, -0.177734375, -0.12109375, -0.064453125, -0.0078125, 0.048828125, 0.10546875, 0.162109375, 0.21875, 0.275390625, 0.33203125, 0.388671875, 0.4453125, 0.501953125, 0.55859375, 0.615234375, 0.671875, 0.728515625, 0.78515625, 0.841796875, 0.8984375, 0.955078125, 1.01171875, 1.068359375, 1.125, 1.181640625, 1.23828125, 1.294921875, 1.3515625, 1.408203125]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 5.0, 3.0, 6.0, 9.0, 8.0, 11.0, 20.0, 32.0, 48.0, 67.0, 99.0, 199.0, 317.0, 664.0, 1631.0, 4874.0, 19090.0, 139369.0, 3667765.0, 318348.0, 30754.0, 6964.0, 2173.0, 868.0, 383.0, 211.0, 113.0, 80.0, 50.0, 42.0, 24.0, 15.0, 12.0, 7.0, 10.0, 6.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.501953125, -2.422882080078125, -2.34381103515625, -2.264739990234375, -2.1856689453125, -2.106597900390625, -2.02752685546875, -1.948455810546875, -1.869384765625, -1.790313720703125, -1.71124267578125, -1.632171630859375, -1.5531005859375, -1.474029541015625, -1.39495849609375, -1.315887451171875, -1.23681640625, -1.157745361328125, -1.07867431640625, -0.999603271484375, -0.9205322265625, -0.841461181640625, -0.76239013671875, -0.683319091796875, -0.604248046875, -0.525177001953125, -0.44610595703125, -0.367034912109375, -0.2879638671875, -0.208892822265625, -0.12982177734375, -0.050750732421875, 0.0283203125, 0.107391357421875, 0.18646240234375, 0.265533447265625, 0.3446044921875, 0.423675537109375, 0.50274658203125, 0.581817626953125, 0.660888671875, 0.739959716796875, 0.81903076171875, 0.898101806640625, 0.9771728515625, 1.056243896484375, 1.13531494140625, 1.214385986328125, 1.29345703125, 1.372528076171875, 1.45159912109375, 1.530670166015625, 1.6097412109375, 1.688812255859375, 1.76788330078125, 1.846954345703125, 1.926025390625, 2.005096435546875, 2.08416748046875, 2.163238525390625, 2.2423095703125, 2.321380615234375, 2.40045166015625, 2.479522705078125, 2.55859375]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 1.0, 6.0, 6.0, 2.0, 10.0, 12.0, 12.0, 13.0, 25.0, 34.0, 40.0, 39.0, 66.0, 84.0, 107.0, 162.0, 303.0, 583.0, 1110.0, 531.0, 302.0, 165.0, 118.0, 81.0, 57.0, 43.0, 39.0, 28.0, 15.0, 15.0, 18.0, 12.0, 9.0, 3.0, 3.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.492431640625, -0.47771453857421875, -0.4629974365234375, -0.44828033447265625, -0.433563232421875, -0.41884613037109375, -0.4041290283203125, -0.38941192626953125, -0.37469482421875, -0.35997772216796875, -0.3452606201171875, -0.33054351806640625, -0.315826416015625, -0.30110931396484375, -0.2863922119140625, -0.27167510986328125, -0.2569580078125, -0.24224090576171875, -0.2275238037109375, -0.21280670166015625, -0.198089599609375, -0.18337249755859375, -0.1686553955078125, -0.15393829345703125, -0.13922119140625, -0.12450408935546875, -0.1097869873046875, -0.09506988525390625, -0.080352783203125, -0.06563568115234375, -0.0509185791015625, -0.03620147705078125, -0.021484375, -0.00676727294921875, 0.0079498291015625, 0.02266693115234375, 0.037384033203125, 0.05210113525390625, 0.0668182373046875, 0.08153533935546875, 0.09625244140625, 0.11096954345703125, 0.1256866455078125, 0.14040374755859375, 0.155120849609375, 0.16983795166015625, 0.1845550537109375, 0.19927215576171875, 0.2139892578125, 0.22870635986328125, 0.2434234619140625, 0.25814056396484375, 0.272857666015625, 0.28757476806640625, 0.3022918701171875, 0.31700897216796875, 0.33172607421875, 0.34644317626953125, 0.3611602783203125, 0.37587738037109375, 0.390594482421875, 0.40531158447265625, 0.4200286865234375, 0.43474578857421875, 0.449462890625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 4.0, 8.0, 13.0, 17.0, 20.0, 29.0, 61.0, 99.0, 153.0, 154.0, 146.0, 100.0, 68.0, 47.0, 23.0, 17.0, 8.0, 5.0, 8.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.9188547134399414, -3.8170411586761475, -3.7152276039123535, -3.6134138107299805, -3.5116002559661865, -3.4097867012023926, -3.3079731464385986, -3.2061595916748047, -3.1043460369110107, -3.002532482147217, -2.900718927383423, -2.798905372619629, -2.697091579437256, -2.595278024673462, -2.493464469909668, -2.391650915145874, -2.28983736038208, -2.188023805618286, -2.086210250854492, -1.9843965768814087, -1.8825830221176147, -1.7807693481445312, -1.6789557933807373, -1.5771422386169434, -1.4753284454345703, -1.3735148906707764, -1.2717012166976929, -1.169887661933899, -1.068074107170105, -0.9662604928016663, -0.8644468784332275, -0.7626333236694336, -0.6608197689056396, -0.5590061545372009, -0.457192599773407, -0.35537898540496826, -0.25356540083885193, -0.1517518162727356, -0.049938201904296875, 0.05187535285949707, 0.1536889672279358, 0.2555025517940521, 0.35731613636016846, 0.4591297507286072, 0.5609433650970459, 0.6627569198608398, 0.7645705342292786, 0.8663840889930725, 0.9681977033615112, 1.0700112581253052, 1.1718249320983887, 1.2736384868621826, 1.3754520416259766, 1.4772655963897705, 1.579079270362854, 1.680892825126648, 1.7827064990997314, 1.8845200538635254, 1.9863337278366089, 2.0881471633911133, 2.1899609565734863, 2.2917745113372803, 2.393588066101074, 2.495401620864868, 2.597215175628662]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 5.0, 10.0, 8.0, 9.0, 9.0, 20.0, 22.0, 27.0, 35.0, 39.0, 60.0, 59.0, 61.0, 77.0, 70.0, 84.0, 62.0, 74.0, 60.0, 41.0, 33.0, 37.0, 28.0, 21.0, 11.0, 6.0, 8.0, 9.0, 5.0, 7.0, 2.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7186734676361084, -1.662857174873352, -1.6070410013198853, -1.551224708557129, -1.495408535003662, -1.4395922422409058, -1.3837759494781494, -1.3279597759246826, -1.2721436023712158, -1.2163273096084595, -1.1605111360549927, -1.1046948432922363, -1.0488786697387695, -0.9930623769760132, -0.9372461438179016, -0.88142991065979, -0.8256136178970337, -0.7697973847389221, -0.7139811515808105, -0.6581648588180542, -0.6023486852645874, -0.546532392501831, -0.4907161593437195, -0.4348999261856079, -0.37908369302749634, -0.32326745986938477, -0.2674512267112732, -0.21163496375083923, -0.15581873059272766, -0.10000249743461609, -0.04418623447418213, 0.011629998683929443, 0.06744611263275146, 0.12326235324144363, 0.1790785938501358, 0.23489484190940857, 0.29071107506752014, 0.3465273082256317, 0.4023435711860657, 0.45815980434417725, 0.5139760375022888, 0.5697922706604004, 0.625608503818512, 0.6814247369766235, 0.7372410297393799, 0.7930572032928467, 0.848873496055603, 0.9046897292137146, 0.9605059623718262, 1.0163222551345825, 1.0721384286880493, 1.1279547214508057, 1.1837708950042725, 1.2395871877670288, 1.2954034805297852, 1.351219654083252, 1.4070358276367188, 1.462852120399475, 1.518668293952942, 1.5744845867156982, 1.630300760269165, 1.6861170530319214, 1.7419333457946777, 1.7977495193481445, 1.8535658121109009]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 7.0, 6.0, 6.0, 14.0, 13.0, 26.0, 42.0, 85.0, 82.0, 144.0, 282.0, 618.0, 1245.0, 3239.0, 11028.0, 63107.0, 720650.0, 215344.0, 23336.0, 5551.0, 1962.0, 799.0, 363.0, 226.0, 125.0, 76.0, 50.0, 38.0, 22.0, 20.0, 13.0, 7.0, 5.0, 4.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.236083984375, -0.22928810119628906, -0.22249221801757812, -0.2156963348388672, -0.20890045166015625, -0.2021045684814453, -0.19530868530273438, -0.18851280212402344, -0.1817169189453125, -0.17492103576660156, -0.16812515258789062, -0.1613292694091797, -0.15453338623046875, -0.1477375030517578, -0.14094161987304688, -0.13414573669433594, -0.127349853515625, -0.12055397033691406, -0.11375808715820312, -0.10696220397949219, -0.10016632080078125, -0.09337043762207031, -0.08657455444335938, -0.07977867126464844, -0.0729827880859375, -0.06618690490722656, -0.059391021728515625, -0.05259513854980469, -0.04579925537109375, -0.03900337219238281, -0.032207489013671875, -0.025411605834960938, -0.01861572265625, -0.011819839477539062, -0.005023956298828125, 0.0017719268798828125, 0.00856781005859375, 0.015363693237304688, 0.022159576416015625, 0.028955459594726562, 0.0357513427734375, 0.04254722595214844, 0.049343109130859375, 0.05613899230957031, 0.06293487548828125, 0.06973075866699219, 0.07652664184570312, 0.08332252502441406, 0.090118408203125, 0.09691429138183594, 0.10371017456054688, 0.11050605773925781, 0.11730194091796875, 0.12409782409667969, 0.13089370727539062, 0.13768959045410156, 0.1444854736328125, 0.15128135681152344, 0.15807723999023438, 0.1648731231689453, 0.17166900634765625, 0.1784648895263672, 0.18526077270507812, 0.19205665588378906, 0.1988525390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 5.0, 4.0, 7.0, 7.0, 20.0, 13.0, 17.0, 30.0, 33.0, 39.0, 46.0, 63.0, 62.0, 68.0, 70.0, 92.0, 87.0, 63.0, 66.0, 45.0, 32.0, 36.0, 21.0, 24.0, 8.0, 8.0, 6.0, 6.0, 5.0, 5.0, 2.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.162109375, -1.1232147216796875, -1.084320068359375, -1.0454254150390625, -1.00653076171875, -0.9676361083984375, -0.928741455078125, -0.8898468017578125, -0.8509521484375, -0.8120574951171875, -0.773162841796875, -0.7342681884765625, -0.69537353515625, -0.6564788818359375, -0.617584228515625, -0.5786895751953125, -0.539794921875, -0.5009002685546875, -0.462005615234375, -0.4231109619140625, -0.38421630859375, -0.3453216552734375, -0.306427001953125, -0.2675323486328125, -0.2286376953125, -0.1897430419921875, -0.150848388671875, -0.1119537353515625, -0.07305908203125, -0.0341644287109375, 0.004730224609375, 0.0436248779296875, 0.08251953125, 0.1214141845703125, 0.160308837890625, 0.1992034912109375, 0.23809814453125, 0.2769927978515625, 0.315887451171875, 0.3547821044921875, 0.3936767578125, 0.4325714111328125, 0.471466064453125, 0.5103607177734375, 0.54925537109375, 0.5881500244140625, 0.627044677734375, 0.6659393310546875, 0.704833984375, 0.7437286376953125, 0.782623291015625, 0.8215179443359375, 0.86041259765625, 0.8993072509765625, 0.938201904296875, 0.9770965576171875, 1.0159912109375, 1.0548858642578125, 1.093780517578125, 1.1326751708984375, 1.17156982421875, 1.2104644775390625, 1.249359130859375, 1.2882537841796875, 1.3271484375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 3.0, 6.0, 7.0, 9.0, 13.0, 22.0, 27.0, 28.0, 42.0, 52.0, 66.0, 87.0, 115.0, 156.0, 204.0, 283.0, 588.0, 1894.0, 9973.0, 83233.0, 730272.0, 197504.0, 19025.0, 2969.0, 788.0, 372.0, 200.0, 138.0, 113.0, 87.0, 62.0, 49.0, 30.0, 35.0, 19.0, 21.0, 15.0, 11.0, 10.0, 9.0, 4.0, 6.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15380859375, -0.14895248413085938, -0.14409637451171875, -0.13924026489257812, -0.1343841552734375, -0.12952804565429688, -0.12467193603515625, -0.11981582641601562, -0.114959716796875, -0.11010360717773438, -0.10524749755859375, -0.10039138793945312, -0.0955352783203125, -0.09067916870117188, -0.08582305908203125, -0.08096694946289062, -0.07611083984375, -0.07125473022460938, -0.06639862060546875, -0.061542510986328125, -0.0566864013671875, -0.051830291748046875, -0.04697418212890625, -0.042118072509765625, -0.037261962890625, -0.032405853271484375, -0.02754974365234375, -0.022693634033203125, -0.0178375244140625, -0.012981414794921875, -0.00812530517578125, -0.003269195556640625, 0.0015869140625, 0.006443023681640625, 0.01129913330078125, 0.016155242919921875, 0.0210113525390625, 0.025867462158203125, 0.03072357177734375, 0.035579681396484375, 0.040435791015625, 0.045291900634765625, 0.05014801025390625, 0.055004119873046875, 0.0598602294921875, 0.06471633911132812, 0.06957244873046875, 0.07442855834960938, 0.07928466796875, 0.08414077758789062, 0.08899688720703125, 0.09385299682617188, 0.0987091064453125, 0.10356521606445312, 0.10842132568359375, 0.11327743530273438, 0.118133544921875, 0.12298965454101562, 0.12784576416015625, 0.13270187377929688, 0.1375579833984375, 0.14241409301757812, 0.14727020263671875, 0.15212631225585938, 0.156982421875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 1.0, 1.0, 3.0, 7.0, 8.0, 11.0, 9.0, 13.0, 17.0, 18.0, 24.0, 24.0, 17.0, 37.0, 38.0, 29.0, 52.0, 55.0, 43.0, 50.0, 53.0, 67.0, 43.0, 41.0, 41.0, 34.0, 34.0, 35.0, 28.0, 20.0, 14.0, 30.0, 22.0, 19.0, 16.0, 7.0, 17.0, 7.0, 5.0, 5.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6181640625, -1.5694427490234375, -1.520721435546875, -1.4720001220703125, -1.42327880859375, -1.3745574951171875, -1.325836181640625, -1.2771148681640625, -1.2283935546875, -1.1796722412109375, -1.130950927734375, -1.0822296142578125, -1.03350830078125, -0.9847869873046875, -0.936065673828125, -0.8873443603515625, -0.838623046875, -0.7899017333984375, -0.741180419921875, -0.6924591064453125, -0.64373779296875, -0.5950164794921875, -0.546295166015625, -0.4975738525390625, -0.4488525390625, -0.4001312255859375, -0.351409912109375, -0.3026885986328125, -0.25396728515625, -0.2052459716796875, -0.156524658203125, -0.1078033447265625, -0.05908203125, -0.0103607177734375, 0.038360595703125, 0.0870819091796875, 0.13580322265625, 0.1845245361328125, 0.233245849609375, 0.2819671630859375, 0.3306884765625, 0.3794097900390625, 0.428131103515625, 0.4768524169921875, 0.52557373046875, 0.5742950439453125, 0.623016357421875, 0.6717376708984375, 0.720458984375, 0.7691802978515625, 0.817901611328125, 0.8666229248046875, 0.91534423828125, 0.9640655517578125, 1.012786865234375, 1.0615081787109375, 1.1102294921875, 1.1589508056640625, 1.207672119140625, 1.2563934326171875, 1.30511474609375, 1.3538360595703125, 1.402557373046875, 1.4512786865234375, 1.5]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 4.0, 8.0, 8.0, 6.0, 12.0, 11.0, 16.0, 21.0, 22.0, 13.0, 29.0, 40.0, 59.0, 79.0, 118.0, 169.0, 272.0, 476.0, 1165.0, 3460.0, 19860.0, 586532.0, 413508.0, 17108.0, 3207.0, 1059.0, 458.0, 232.0, 166.0, 108.0, 59.0, 70.0, 48.0, 40.0, 22.0, 16.0, 16.0, 11.0, 7.0, 7.0, 6.0, 5.0, 4.0, 8.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.03173828125, -0.03077554702758789, -0.02981281280517578, -0.028850078582763672, -0.027887344360351562, -0.026924610137939453, -0.025961875915527344, -0.024999141693115234, -0.024036407470703125, -0.023073673248291016, -0.022110939025878906, -0.021148204803466797, -0.020185470581054688, -0.019222736358642578, -0.01826000213623047, -0.01729726791381836, -0.01633453369140625, -0.01537179946899414, -0.014409065246582031, -0.013446331024169922, -0.012483596801757812, -0.011520862579345703, -0.010558128356933594, -0.009595394134521484, -0.008632659912109375, -0.007669925689697266, -0.006707191467285156, -0.005744457244873047, -0.0047817230224609375, -0.003818988800048828, -0.0028562545776367188, -0.0018935203552246094, -0.0009307861328125, 3.1948089599609375e-05, 0.0009946823120117188, 0.001957416534423828, 0.0029201507568359375, 0.003882884979248047, 0.004845619201660156, 0.005808353424072266, 0.006771087646484375, 0.007733821868896484, 0.008696556091308594, 0.009659290313720703, 0.010622024536132812, 0.011584758758544922, 0.012547492980957031, 0.01351022720336914, 0.01447296142578125, 0.01543569564819336, 0.01639842987060547, 0.017361164093017578, 0.018323898315429688, 0.019286632537841797, 0.020249366760253906, 0.021212100982666016, 0.022174835205078125, 0.023137569427490234, 0.024100303649902344, 0.025063037872314453, 0.026025772094726562, 0.026988506317138672, 0.02795124053955078, 0.02891397476196289, 0.029876708984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 5.0, 7.0, 8.0, 11.0, 13.0, 20.0, 43.0, 73.0, 139.0, 171.0, 172.0, 131.0, 70.0, 53.0, 23.0, 8.0, 13.0, 8.0, 4.0, 5.0, 3.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2695789337158203e-05, -1.2025237083435059e-05, -1.1354684829711914e-05, -1.068413257598877e-05, -1.0013580322265625e-05, -9.34302806854248e-06, -8.672475814819336e-06, -8.001923561096191e-06, -7.331371307373047e-06, -6.660819053649902e-06, -5.990266799926758e-06, -5.319714546203613e-06, -4.649162292480469e-06, -3.978610038757324e-06, -3.3080577850341797e-06, -2.637505531311035e-06, -1.9669532775878906e-06, -1.296401023864746e-06, -6.258487701416016e-07, 4.470348358154297e-08, 7.152557373046875e-07, 1.385807991027832e-06, 2.0563602447509766e-06, 2.726912498474121e-06, 3.3974647521972656e-06, 4.06801700592041e-06, 4.738569259643555e-06, 5.409121513366699e-06, 6.079673767089844e-06, 6.750226020812988e-06, 7.420778274536133e-06, 8.091330528259277e-06, 8.761882781982422e-06, 9.432435035705566e-06, 1.0102987289428711e-05, 1.0773539543151855e-05, 1.1444091796875e-05, 1.2114644050598145e-05, 1.2785196304321289e-05, 1.3455748558044434e-05, 1.4126300811767578e-05, 1.4796853065490723e-05, 1.5467405319213867e-05, 1.6137957572937012e-05, 1.6808509826660156e-05, 1.74790620803833e-05, 1.8149614334106445e-05, 1.882016658782959e-05, 1.9490718841552734e-05, 2.016127109527588e-05, 2.0831823348999023e-05, 2.1502375602722168e-05, 2.2172927856445312e-05, 2.2843480110168457e-05, 2.35140323638916e-05, 2.4184584617614746e-05, 2.485513687133789e-05, 2.5525689125061035e-05, 2.619624137878418e-05, 2.6866793632507324e-05, 2.753734588623047e-05, 2.8207898139953613e-05, 2.8878450393676758e-05, 2.9549002647399902e-05, 3.0219554901123047e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 9.0, 7.0, 12.0, 11.0, 9.0, 16.0, 27.0, 35.0, 35.0, 61.0, 84.0, 126.0, 154.0, 263.0, 406.0, 741.0, 1593.0, 3861.0, 13132.0, 83005.0, 853407.0, 72150.0, 12308.0, 3627.0, 1492.0, 728.0, 382.0, 233.0, 169.0, 125.0, 91.0, 73.0, 41.0, 42.0, 21.0, 14.0, 16.0, 10.0, 6.0, 7.0, 11.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.043182373046875, -0.04196500778198242, -0.040747642517089844, -0.039530277252197266, -0.03831291198730469, -0.03709554672241211, -0.03587818145751953, -0.03466081619262695, -0.033443450927734375, -0.0322260856628418, -0.03100872039794922, -0.02979135513305664, -0.028573989868164062, -0.027356624603271484, -0.026139259338378906, -0.024921894073486328, -0.02370452880859375, -0.022487163543701172, -0.021269798278808594, -0.020052433013916016, -0.018835067749023438, -0.01761770248413086, -0.01640033721923828, -0.015182971954345703, -0.013965606689453125, -0.012748241424560547, -0.011530876159667969, -0.01031351089477539, -0.009096145629882812, -0.007878780364990234, -0.006661415100097656, -0.005444049835205078, -0.0042266845703125, -0.003009319305419922, -0.0017919540405273438, -0.0005745887756347656, 0.0006427764892578125, 0.0018601417541503906, 0.0030775070190429688, 0.004294872283935547, 0.005512237548828125, 0.006729602813720703, 0.007946968078613281, 0.00916433334350586, 0.010381698608398438, 0.011599063873291016, 0.012816429138183594, 0.014033794403076172, 0.01525115966796875, 0.016468524932861328, 0.017685890197753906, 0.018903255462646484, 0.020120620727539062, 0.02133798599243164, 0.02255535125732422, 0.023772716522216797, 0.024990081787109375, 0.026207447052001953, 0.02742481231689453, 0.02864217758178711, 0.029859542846679688, 0.031076908111572266, 0.032294273376464844, 0.03351163864135742, 0.03472900390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 7.0, 2.0, 2.0, 3.0, 9.0, 6.0, 7.0, 13.0, 15.0, 14.0, 19.0, 35.0, 47.0, 58.0, 131.0, 157.0, 147.0, 119.0, 71.0, 42.0, 27.0, 15.0, 14.0, 9.0, 8.0, 10.0, 5.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005832672119140625, -0.005655527114868164, -0.005478382110595703, -0.005301237106323242, -0.005124092102050781, -0.00494694709777832, -0.004769802093505859, -0.0045926570892333984, -0.0044155120849609375, -0.0042383670806884766, -0.004061222076416016, -0.0038840770721435547, -0.0037069320678710938, -0.003529787063598633, -0.003352642059326172, -0.003175497055053711, -0.00299835205078125, -0.002821207046508789, -0.002644062042236328, -0.002466917037963867, -0.0022897720336914062, -0.0021126270294189453, -0.0019354820251464844, -0.0017583370208740234, -0.0015811920166015625, -0.0014040470123291016, -0.0012269020080566406, -0.0010497570037841797, -0.0008726119995117188, -0.0006954669952392578, -0.0005183219909667969, -0.00034117698669433594, -0.000164031982421875, 1.3113021850585938e-05, 0.00019025802612304688, 0.0003674030303955078, 0.0005445480346679688, 0.0007216930389404297, 0.0008988380432128906, 0.0010759830474853516, 0.0012531280517578125, 0.0014302730560302734, 0.0016074180603027344, 0.0017845630645751953, 0.0019617080688476562, 0.002138853073120117, 0.002315998077392578, 0.002493143081665039, 0.0026702880859375, 0.002847433090209961, 0.003024578094482422, 0.003201723098754883, 0.0033788681030273438, 0.0035560131072998047, 0.0037331581115722656, 0.0039103031158447266, 0.0040874481201171875, 0.0042645931243896484, 0.004441738128662109, 0.00461888313293457, 0.004796028137207031, 0.004973173141479492, 0.005150318145751953, 0.005327463150024414, 0.005504608154296875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 6.0, 11.0, 12.0, 22.0, 28.0, 53.0, 124.0, 177.0, 201.0, 155.0, 81.0, 51.0, 30.0, 16.0, 6.0, 6.0, 6.0, 3.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.0517942905426025, -2.969870090484619, -2.8879458904266357, -2.8060214519500732, -2.72409725189209, -2.6421730518341064, -2.560248851776123, -2.4783246517181396, -2.3964004516601562, -2.314476251602173, -2.2325520515441895, -2.150627613067627, -2.0687034130096436, -1.9867792129516602, -1.9048550128936768, -1.8229308128356934, -1.7410063743591309, -1.6590821743011475, -1.5771578550338745, -1.4952336549758911, -1.4133093357086182, -1.3313851356506348, -1.2494609355926514, -1.167536735534668, -1.085612416267395, -1.0036882162094116, -0.9217638969421387, -0.8398396968841553, -0.7579154372215271, -0.6759911775588989, -0.5940669775009155, -0.5121427178382874, -0.4302184581756592, -0.348294198513031, -0.2663699686527252, -0.18444572389125824, -0.10252147912979126, -0.020597219467163086, 0.0613270103931427, 0.1432512402534485, 0.22517549991607666, 0.30709975957870483, 0.3890239894390106, 0.4709482192993164, 0.5528724789619446, 0.6347967386245728, 0.7167209386825562, 0.7986451983451843, 0.8805694580078125, 0.9624937176704407, 1.0444179773330688, 1.1263421773910522, 1.2082664966583252, 1.2901906967163086, 1.372114896774292, 1.4540390968322754, 1.5359634160995483, 1.6178876161575317, 1.6998119354248047, 1.781736135482788, 1.8636603355407715, 1.9455846548080444, 2.0275089740753174, 2.109433174133301, 2.191357374191284]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 4.0, 10.0, 9.0, 9.0, 14.0, 24.0, 24.0, 39.0, 39.0, 71.0, 71.0, 74.0, 83.0, 84.0, 86.0, 76.0, 74.0, 45.0, 38.0, 34.0, 22.0, 19.0, 14.0, 4.0, 6.0, 8.0, 4.0, 1.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3675426244735718, -1.326404333114624, -1.2852660417556763, -1.244127869606018, -1.2029895782470703, -1.1618512868881226, -1.1207129955291748, -1.079574704170227, -1.0384364128112793, -0.9972981214523315, -0.9561598896980286, -0.9150215983390808, -0.8738833665847778, -0.8327450752258301, -0.7916067838668823, -0.7504684925079346, -0.7093303203582764, -0.6681920289993286, -0.6270537972450256, -0.5859155058860779, -0.5447772741317749, -0.5036389827728271, -0.4625006914138794, -0.42136242985725403, -0.38022416830062866, -0.3390859067440033, -0.29794764518737793, -0.2568093538284302, -0.2156710922718048, -0.17453283071517944, -0.13339455425739288, -0.09225627779960632, -0.05111813545227051, -0.009979866445064545, 0.03115840256214142, 0.07229667156934738, 0.11343494057655334, 0.1545732021331787, 0.19571147859096527, 0.23684975504875183, 0.2779880166053772, 0.31912627816200256, 0.36026453971862793, 0.4014028310775757, 0.44254109263420105, 0.4836793541908264, 0.5248176455497742, 0.5659558773040771, 0.6070941686630249, 0.6482324600219727, 0.6893706917762756, 0.7305089831352234, 0.7716472148895264, 0.8127855062484741, 0.8539237976074219, 0.8950620889663696, 0.9362003207206726, 0.9773386120796204, 1.0184768438339233, 1.059615135192871, 1.1007534265518188, 1.1418917179107666, 1.1830298900604248, 1.2241681814193726, 1.2653064727783203]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 5.0, 1.0, 2.0, 5.0, 13.0, 10.0, 17.0, 24.0, 37.0, 38.0, 71.0, 86.0, 159.0, 229.0, 400.0, 659.0, 1046.0, 2039.0, 4097.0, 8811.0, 21796.0, 70174.0, 638759.0, 227513.0, 43726.0, 15178.0, 6610.0, 3060.0, 1624.0, 912.0, 526.0, 326.0, 211.0, 111.0, 86.0, 57.0, 41.0, 30.0, 13.0, 14.0, 7.0, 11.0, 7.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.9228515625, -0.8908233642578125, -0.858795166015625, -0.8267669677734375, -0.79473876953125, -0.7627105712890625, -0.730682373046875, -0.6986541748046875, -0.6666259765625, -0.6345977783203125, -0.602569580078125, -0.5705413818359375, -0.53851318359375, -0.5064849853515625, -0.474456787109375, -0.4424285888671875, -0.410400390625, -0.3783721923828125, -0.346343994140625, -0.3143157958984375, -0.28228759765625, -0.2502593994140625, -0.218231201171875, -0.1862030029296875, -0.1541748046875, -0.1221466064453125, -0.090118408203125, -0.0580902099609375, -0.02606201171875, 0.0059661865234375, 0.037994384765625, 0.0700225830078125, 0.10205078125, 0.1340789794921875, 0.166107177734375, 0.1981353759765625, 0.23016357421875, 0.2621917724609375, 0.294219970703125, 0.3262481689453125, 0.3582763671875, 0.3903045654296875, 0.422332763671875, 0.4543609619140625, 0.48638916015625, 0.5184173583984375, 0.550445556640625, 0.5824737548828125, 0.614501953125, 0.6465301513671875, 0.678558349609375, 0.7105865478515625, 0.74261474609375, 0.7746429443359375, 0.806671142578125, 0.8386993408203125, 0.8707275390625, 0.9027557373046875, 0.934783935546875, 0.9668121337890625, 0.99884033203125, 1.0308685302734375, 1.062896728515625, 1.0949249267578125, 1.126953125]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 5.0, 7.0, 15.0, 11.0, 18.0, 16.0, 36.0, 38.0, 45.0, 63.0, 77.0, 74.0, 103.0, 93.0, 84.0, 71.0, 66.0, 41.0, 35.0, 25.0, 17.0, 12.0, 3.0, 13.0, 6.0, 2.0, 5.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.583984375, -2.497406005859375, -2.41082763671875, -2.324249267578125, -2.2376708984375, -2.151092529296875, -2.06451416015625, -1.977935791015625, -1.891357421875, -1.804779052734375, -1.71820068359375, -1.631622314453125, -1.5450439453125, -1.458465576171875, -1.37188720703125, -1.285308837890625, -1.19873046875, -1.112152099609375, -1.02557373046875, -0.938995361328125, -0.8524169921875, -0.765838623046875, -0.67926025390625, -0.592681884765625, -0.506103515625, -0.419525146484375, -0.33294677734375, -0.246368408203125, -0.1597900390625, -0.073211669921875, 0.01336669921875, 0.099945068359375, 0.1865234375, 0.273101806640625, 0.35968017578125, 0.446258544921875, 0.5328369140625, 0.619415283203125, 0.70599365234375, 0.792572021484375, 0.879150390625, 0.965728759765625, 1.05230712890625, 1.138885498046875, 1.2254638671875, 1.312042236328125, 1.39862060546875, 1.485198974609375, 1.57177734375, 1.658355712890625, 1.74493408203125, 1.831512451171875, 1.9180908203125, 2.004669189453125, 2.09124755859375, 2.177825927734375, 2.264404296875, 2.350982666015625, 2.43756103515625, 2.524139404296875, 2.6107177734375, 2.697296142578125, 2.78387451171875, 2.870452880859375, 2.95703125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 9.0, 10.0, 13.0, 12.0, 18.0, 22.0, 27.0, 33.0, 53.0, 67.0, 95.0, 153.0, 218.0, 438.0, 1080.0, 3590.0, 18769.0, 205319.0, 775480.0, 34411.0, 5763.0, 1532.0, 562.0, 292.0, 162.0, 117.0, 77.0, 48.0, 50.0, 24.0, 22.0, 20.0, 17.0, 10.0, 9.0, 2.0, 4.0, 3.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-1.66796875, -1.6176605224609375, -1.567352294921875, -1.5170440673828125, -1.46673583984375, -1.4164276123046875, -1.366119384765625, -1.3158111572265625, -1.2655029296875, -1.2151947021484375, -1.164886474609375, -1.1145782470703125, -1.06427001953125, -1.0139617919921875, -0.963653564453125, -0.9133453369140625, -0.863037109375, -0.8127288818359375, -0.762420654296875, -0.7121124267578125, -0.66180419921875, -0.6114959716796875, -0.561187744140625, -0.5108795166015625, -0.4605712890625, -0.4102630615234375, -0.359954833984375, -0.3096466064453125, -0.25933837890625, -0.2090301513671875, -0.158721923828125, -0.1084136962890625, -0.05810546875, -0.0077972412109375, 0.042510986328125, 0.0928192138671875, 0.14312744140625, 0.1934356689453125, 0.243743896484375, 0.2940521240234375, 0.3443603515625, 0.3946685791015625, 0.444976806640625, 0.4952850341796875, 0.54559326171875, 0.5959014892578125, 0.646209716796875, 0.6965179443359375, 0.746826171875, 0.7971343994140625, 0.847442626953125, 0.8977508544921875, 0.94805908203125, 0.9983673095703125, 1.048675537109375, 1.0989837646484375, 1.1492919921875, 1.1996002197265625, 1.249908447265625, 1.3002166748046875, 1.35052490234375, 1.4008331298828125, 1.451141357421875, 1.5014495849609375, 1.5517578125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 2.0, 4.0, 6.0, 6.0, 3.0, 15.0, 9.0, 12.0, 18.0, 12.0, 21.0, 26.0, 36.0, 43.0, 35.0, 30.0, 45.0, 45.0, 51.0, 35.0, 56.0, 56.0, 44.0, 44.0, 46.0, 45.0, 36.0, 32.0, 41.0, 21.0, 20.0, 22.0, 19.0, 9.0, 10.0, 9.0, 9.0, 12.0, 6.0, 5.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.5, -2.433624267578125, -2.36724853515625, -2.300872802734375, -2.2344970703125, -2.168121337890625, -2.10174560546875, -2.035369873046875, -1.968994140625, -1.902618408203125, -1.83624267578125, -1.769866943359375, -1.7034912109375, -1.637115478515625, -1.57073974609375, -1.504364013671875, -1.43798828125, -1.371612548828125, -1.30523681640625, -1.238861083984375, -1.1724853515625, -1.106109619140625, -1.03973388671875, -0.973358154296875, -0.906982421875, -0.840606689453125, -0.77423095703125, -0.707855224609375, -0.6414794921875, -0.575103759765625, -0.50872802734375, -0.442352294921875, -0.3759765625, -0.309600830078125, -0.24322509765625, -0.176849365234375, -0.1104736328125, -0.044097900390625, 0.02227783203125, 0.088653564453125, 0.155029296875, 0.221405029296875, 0.28778076171875, 0.354156494140625, 0.4205322265625, 0.486907958984375, 0.55328369140625, 0.619659423828125, 0.68603515625, 0.752410888671875, 0.81878662109375, 0.885162353515625, 0.9515380859375, 1.017913818359375, 1.08428955078125, 1.150665283203125, 1.217041015625, 1.283416748046875, 1.34979248046875, 1.416168212890625, 1.4825439453125, 1.548919677734375, 1.61529541015625, 1.681671142578125, 1.748046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 6.0, 6.0, 17.0, 16.0, 19.0, 38.0, 56.0, 96.0, 253.0, 569.0, 1555.0, 5156.0, 22908.0, 169040.0, 792822.0, 43669.0, 8468.0, 2340.0, 839.0, 331.0, 120.0, 80.0, 48.0, 24.0, 19.0, 12.0, 13.0, 11.0, 5.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.689453125, -0.6673431396484375, -0.645233154296875, -0.6231231689453125, -0.60101318359375, -0.5789031982421875, -0.556793212890625, -0.5346832275390625, -0.5125732421875, -0.4904632568359375, -0.468353271484375, -0.4462432861328125, -0.42413330078125, -0.4020233154296875, -0.379913330078125, -0.3578033447265625, -0.335693359375, -0.3135833740234375, -0.291473388671875, -0.2693634033203125, -0.24725341796875, -0.2251434326171875, -0.203033447265625, -0.1809234619140625, -0.1588134765625, -0.1367034912109375, -0.114593505859375, -0.0924835205078125, -0.07037353515625, -0.0482635498046875, -0.026153564453125, -0.0040435791015625, 0.01806640625, 0.0401763916015625, 0.062286376953125, 0.0843963623046875, 0.10650634765625, 0.1286163330078125, 0.150726318359375, 0.1728363037109375, 0.1949462890625, 0.2170562744140625, 0.239166259765625, 0.2612762451171875, 0.28338623046875, 0.3054962158203125, 0.327606201171875, 0.3497161865234375, 0.371826171875, 0.3939361572265625, 0.416046142578125, 0.4381561279296875, 0.46026611328125, 0.4823760986328125, 0.504486083984375, 0.5265960693359375, 0.5487060546875, 0.5708160400390625, 0.592926025390625, 0.6150360107421875, 0.63714599609375, 0.6592559814453125, 0.681365966796875, 0.7034759521484375, 0.7255859375]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 4.0, 0.0, 6.0, 7.0, 2.0, 6.0, 7.0, 10.0, 7.0, 17.0, 16.0, 23.0, 20.0, 29.0, 53.0, 114.0, 322.0, 160.0, 45.0, 32.0, 40.0, 16.0, 13.0, 16.0, 11.0, 12.0, 7.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00010305643081665039, -0.00010038726031780243, -9.771808981895447e-05, -9.50489193201065e-05, -9.237974882125854e-05, -8.971057832241058e-05, -8.704140782356262e-05, -8.437223732471466e-05, -8.17030668258667e-05, -7.903389632701874e-05, -7.636472582817078e-05, -7.369555532932281e-05, -7.102638483047485e-05, -6.835721433162689e-05, -6.568804383277893e-05, -6.301887333393097e-05, -6.034970283508301e-05, -5.7680532336235046e-05, -5.5011361837387085e-05, -5.2342191338539124e-05, -4.967302083969116e-05, -4.70038503408432e-05, -4.433467984199524e-05, -4.166550934314728e-05, -3.8996338844299316e-05, -3.6327168345451355e-05, -3.3657997846603394e-05, -3.098882734775543e-05, -2.831965684890747e-05, -2.565048635005951e-05, -2.2981315851211548e-05, -2.0312145352363586e-05, -1.7642974853515625e-05, -1.4973804354667664e-05, -1.2304633855819702e-05, -9.63546335697174e-06, -6.966292858123779e-06, -4.297122359275818e-06, -1.6279518604278564e-06, 1.041218638420105e-06, 3.7103891372680664e-06, 6.379559636116028e-06, 9.04873013496399e-06, 1.171790063381195e-05, 1.4387071132659912e-05, 1.7056241631507874e-05, 1.9725412130355835e-05, 2.2394582629203796e-05, 2.5063753128051758e-05, 2.773292362689972e-05, 3.040209412574768e-05, 3.307126462459564e-05, 3.5740435123443604e-05, 3.8409605622291565e-05, 4.1078776121139526e-05, 4.374794661998749e-05, 4.641711711883545e-05, 4.908628761768341e-05, 5.175545811653137e-05, 5.4424628615379333e-05, 5.7093799114227295e-05, 5.9762969613075256e-05, 6.243214011192322e-05, 6.510131061077118e-05, 6.777048110961914e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 3.0, 7.0, 2.0, 17.0, 12.0, 15.0, 35.0, 53.0, 69.0, 138.0, 206.0, 380.0, 730.0, 1695.0, 4364.0, 14559.0, 60658.0, 748403.0, 170576.0, 32578.0, 8745.0, 2832.0, 1145.0, 563.0, 301.0, 148.0, 97.0, 71.0, 46.0, 33.0, 24.0, 8.0, 11.0, 14.0, 10.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56689453125, -0.5490646362304688, -0.5312347412109375, -0.5134048461914062, -0.495574951171875, -0.47774505615234375, -0.4599151611328125, -0.44208526611328125, -0.42425537109375, -0.40642547607421875, -0.3885955810546875, -0.37076568603515625, -0.352935791015625, -0.33510589599609375, -0.3172760009765625, -0.29944610595703125, -0.2816162109375, -0.26378631591796875, -0.2459564208984375, -0.22812652587890625, -0.210296630859375, -0.19246673583984375, -0.1746368408203125, -0.15680694580078125, -0.13897705078125, -0.12114715576171875, -0.1033172607421875, -0.08548736572265625, -0.067657470703125, -0.04982757568359375, -0.0319976806640625, -0.01416778564453125, 0.003662109375, 0.02149200439453125, 0.0393218994140625, 0.05715179443359375, 0.074981689453125, 0.09281158447265625, 0.1106414794921875, 0.12847137451171875, 0.14630126953125, 0.16413116455078125, 0.1819610595703125, 0.19979095458984375, 0.217620849609375, 0.23545074462890625, 0.2532806396484375, 0.27111053466796875, 0.2889404296875, 0.30677032470703125, 0.3246002197265625, 0.34243011474609375, 0.360260009765625, 0.37808990478515625, 0.3959197998046875, 0.41374969482421875, 0.43157958984375, 0.44940948486328125, 0.4672393798828125, 0.48506927490234375, 0.502899169921875, 0.5207290649414062, 0.5385589599609375, 0.5563888549804688, 0.57421875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 1.0, 4.0, 6.0, 5.0, 8.0, 11.0, 15.0, 10.0, 31.0, 31.0, 23.0, 42.0, 50.0, 115.0, 375.0, 73.0, 46.0, 34.0, 27.0, 18.0, 18.0, 9.0, 15.0, 9.0, 5.0, 3.0, 6.0, 4.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25048828125, -0.24358558654785156, -0.23668289184570312, -0.2297801971435547, -0.22287750244140625, -0.2159748077392578, -0.20907211303710938, -0.20216941833496094, -0.1952667236328125, -0.18836402893066406, -0.18146133422851562, -0.1745586395263672, -0.16765594482421875, -0.1607532501220703, -0.15385055541992188, -0.14694786071777344, -0.140045166015625, -0.13314247131347656, -0.12623977661132812, -0.11933708190917969, -0.11243438720703125, -0.10553169250488281, -0.09862899780273438, -0.09172630310058594, -0.0848236083984375, -0.07792091369628906, -0.07101821899414062, -0.06411552429199219, -0.05721282958984375, -0.05031013488769531, -0.043407440185546875, -0.03650474548339844, -0.02960205078125, -0.022699356079101562, -0.015796661376953125, -0.008893966674804688, -0.00199127197265625, 0.0049114227294921875, 0.011814117431640625, 0.018716812133789062, 0.0256195068359375, 0.03252220153808594, 0.039424896240234375, 0.04632759094238281, 0.05323028564453125, 0.06013298034667969, 0.06703567504882812, 0.07393836975097656, 0.080841064453125, 0.08774375915527344, 0.09464645385742188, 0.10154914855957031, 0.10845184326171875, 0.11535453796386719, 0.12225723266601562, 0.12915992736816406, 0.1360626220703125, 0.14296531677246094, 0.14986801147460938, 0.1567707061767578, 0.16367340087890625, 0.1705760955810547, 0.17747879028320312, 0.18438148498535156, 0.1912841796875]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 6.0, 11.0, 19.0, 19.0, 16.0, 49.0, 82.0, 106.0, 168.0, 128.0, 135.0, 86.0, 50.0, 44.0, 18.0, 15.0, 6.0, 2.0, 7.0, 4.0, 8.0, 2.0, 1.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.19025993347168, -4.055255889892578, -3.9202523231506348, -3.7852485179901123, -3.65024471282959, -3.5152406692504883, -3.380236864089966, -3.2452330589294434, -3.110229253768921, -2.9752254486083984, -2.840221643447876, -2.7052178382873535, -2.570213794708252, -2.4352102279663086, -2.300206184387207, -2.1652023792266846, -2.030198574066162, -1.8951947689056396, -1.7601909637451172, -1.6251870393753052, -1.4901832342147827, -1.3551794290542603, -1.2201755046844482, -1.0851716995239258, -0.9501678943634033, -0.8151640892028809, -0.6801602244377136, -0.5451563596725464, -0.4101525545120239, -0.27514874935150146, -0.14014488458633423, -0.005141019821166992, 0.12986278533935547, 0.2648666203022003, 0.39987045526504517, 0.5348743200302124, 0.6698781251907349, 0.8048819303512573, 0.9398857951164246, 1.0748896598815918, 1.2098934650421143, 1.3448972702026367, 1.4799010753631592, 1.6149049997329712, 1.7499088048934937, 1.8849126100540161, 2.019916534423828, 2.1549203395843506, 2.289924144744873, 2.4249279499053955, 2.559931755065918, 2.6949355602264404, 2.829939365386963, 2.9649434089660645, 3.099947214126587, 3.2349510192871094, 3.369954824447632, 3.5049586296081543, 3.6399624347686768, 3.774966239929199, 3.909970283508301, 4.044973850250244, 4.179977893829346, 4.314981460571289, 4.449985504150391]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 7.0, 10.0, 7.0, 8.0, 8.0, 10.0, 11.0, 14.0, 17.0, 13.0, 22.0, 27.0, 21.0, 31.0, 38.0, 37.0, 45.0, 39.0, 46.0, 43.0, 40.0, 35.0, 43.0, 45.0, 42.0, 45.0, 27.0, 23.0, 38.0, 30.0, 27.0, 26.0, 22.0, 17.0, 16.0, 12.0, 10.0, 16.0, 5.0, 6.0, 4.0, 2.0, 4.0, 2.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.383150815963745, -3.276851177215576, -3.1705517768859863, -3.0642521381378174, -2.9579524993896484, -2.8516530990600586, -2.7453534603118896, -2.6390538215637207, -2.532754421234131, -2.426454782485962, -2.320155382156372, -2.213855743408203, -2.107556104660034, -2.0012564659118652, -1.8949570655822754, -1.7886574268341064, -1.6823577880859375, -1.576058268547058, -1.4697586297988892, -1.3634591102600098, -1.2571594715118408, -1.1508599519729614, -1.044560432434082, -0.9382608532905579, -0.8319612741470337, -0.7256616950035095, -0.6193621158599854, -0.513062596321106, -0.4067630171775818, -0.3004634380340576, -0.19416391849517822, -0.08786433935165405, 0.01843547821044922, 0.1247350424528122, 0.23103460669517517, 0.33733415603637695, 0.4436337351799011, 0.5499333143234253, 0.6562328338623047, 0.7625324130058289, 0.868831992149353, 0.9751315712928772, 1.0814311504364014, 1.1877306699752808, 1.2940301895141602, 1.400329828262329, 1.5066293478012085, 1.612928867340088, 1.7192285060882568, 1.8255280256271362, 1.9318276643753052, 2.0381271839141846, 2.1444268226623535, 2.2507262229919434, 2.3570258617401123, 2.4633255004882812, 2.569624900817871, 2.67592453956604, 2.78222393989563, 2.888523578643799, 2.9948232173919678, 3.1011228561401367, 3.2074222564697266, 3.3137218952178955, 3.4200215339660645]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 4.0, 2.0, 4.0, 3.0, 9.0, 5.0, 9.0, 8.0, 16.0, 29.0, 31.0, 57.0, 71.0, 93.0, 166.0, 293.0, 447.0, 815.0, 1592.0, 3950.0, 11213.0, 46311.0, 500689.0, 3438684.0, 152197.0, 24847.0, 7064.0, 2714.0, 1295.0, 605.0, 376.0, 240.0, 134.0, 70.0, 66.0, 43.0, 35.0, 32.0, 19.0, 16.0, 11.0, 8.0, 2.0, 1.0, 5.0, 2.0, 5.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.26171875, -2.191680908203125, -2.12164306640625, -2.051605224609375, -1.9815673828125, -1.911529541015625, -1.84149169921875, -1.771453857421875, -1.701416015625, -1.631378173828125, -1.56134033203125, -1.491302490234375, -1.4212646484375, -1.351226806640625, -1.28118896484375, -1.211151123046875, -1.14111328125, -1.071075439453125, -1.00103759765625, -0.930999755859375, -0.8609619140625, -0.790924072265625, -0.72088623046875, -0.650848388671875, -0.580810546875, -0.510772705078125, -0.44073486328125, -0.370697021484375, -0.3006591796875, -0.230621337890625, -0.16058349609375, -0.090545654296875, -0.0205078125, 0.049530029296875, 0.11956787109375, 0.189605712890625, 0.2596435546875, 0.329681396484375, 0.39971923828125, 0.469757080078125, 0.539794921875, 0.609832763671875, 0.67987060546875, 0.749908447265625, 0.8199462890625, 0.889984130859375, 0.96002197265625, 1.030059814453125, 1.10009765625, 1.170135498046875, 1.24017333984375, 1.310211181640625, 1.3802490234375, 1.450286865234375, 1.52032470703125, 1.590362548828125, 1.660400390625, 1.730438232421875, 1.80047607421875, 1.870513916015625, 1.9405517578125, 2.010589599609375, 2.08062744140625, 2.150665283203125, 2.220703125]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 5.0, 9.0, 10.0, 11.0, 19.0, 30.0, 41.0, 47.0, 67.0, 66.0, 93.0, 95.0, 127.0, 105.0, 78.0, 59.0, 42.0, 26.0, 19.0, 8.0, 9.0, 10.0, 7.0, 8.0, 1.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.037109375, -1.9802093505859375, -1.923309326171875, -1.8664093017578125, -1.80950927734375, -1.7526092529296875, -1.695709228515625, -1.6388092041015625, -1.5819091796875, -1.5250091552734375, -1.468109130859375, -1.4112091064453125, -1.35430908203125, -1.2974090576171875, -1.240509033203125, -1.1836090087890625, -1.126708984375, -1.0698089599609375, -1.012908935546875, -0.9560089111328125, -0.89910888671875, -0.8422088623046875, -0.785308837890625, -0.7284088134765625, -0.6715087890625, -0.6146087646484375, -0.557708740234375, -0.5008087158203125, -0.44390869140625, -0.3870086669921875, -0.330108642578125, -0.2732086181640625, -0.21630859375, -0.1594085693359375, -0.102508544921875, -0.0456085205078125, 0.01129150390625, 0.0681915283203125, 0.125091552734375, 0.1819915771484375, 0.2388916015625, 0.2957916259765625, 0.352691650390625, 0.4095916748046875, 0.46649169921875, 0.5233917236328125, 0.580291748046875, 0.6371917724609375, 0.694091796875, 0.7509918212890625, 0.807891845703125, 0.8647918701171875, 0.92169189453125, 0.9785919189453125, 1.035491943359375, 1.0923919677734375, 1.1492919921875, 1.2061920166015625, 1.263092041015625, 1.3199920654296875, 1.37689208984375, 1.4337921142578125, 1.490692138671875, 1.5475921630859375, 1.6044921875]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 5.0, 4.0, 6.0, 6.0, 11.0, 22.0, 31.0, 43.0, 83.0, 155.0, 270.0, 575.0, 1664.0, 5772.0, 33430.0, 671844.0, 3392001.0, 74528.0, 9807.0, 2444.0, 822.0, 353.0, 160.0, 86.0, 55.0, 34.0, 24.0, 16.0, 8.0, 8.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.259765625, -3.158447265625, -3.05712890625, -2.955810546875, -2.8544921875, -2.753173828125, -2.65185546875, -2.550537109375, -2.44921875, -2.347900390625, -2.24658203125, -2.145263671875, -2.0439453125, -1.942626953125, -1.84130859375, -1.739990234375, -1.638671875, -1.537353515625, -1.43603515625, -1.334716796875, -1.2333984375, -1.132080078125, -1.03076171875, -0.929443359375, -0.828125, -0.726806640625, -0.62548828125, -0.524169921875, -0.4228515625, -0.321533203125, -0.22021484375, -0.118896484375, -0.017578125, 0.083740234375, 0.18505859375, 0.286376953125, 0.3876953125, 0.489013671875, 0.59033203125, 0.691650390625, 0.79296875, 0.894287109375, 0.99560546875, 1.096923828125, 1.1982421875, 1.299560546875, 1.40087890625, 1.502197265625, 1.603515625, 1.704833984375, 1.80615234375, 1.907470703125, 2.0087890625, 2.110107421875, 2.21142578125, 2.312744140625, 2.4140625, 2.515380859375, 2.61669921875, 2.718017578125, 2.8193359375, 2.920654296875, 3.02197265625, 3.123291015625, 3.224609375]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 3.0, 5.0, 4.0, 6.0, 8.0, 9.0, 20.0, 9.0, 21.0, 25.0, 41.0, 57.0, 56.0, 118.0, 184.0, 310.0, 518.0, 1033.0, 643.0, 350.0, 195.0, 147.0, 92.0, 51.0, 47.0, 33.0, 28.0, 15.0, 11.0, 11.0, 6.0, 11.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4501953125, -0.43193817138671875, -0.4136810302734375, -0.39542388916015625, -0.377166748046875, -0.35890960693359375, -0.3406524658203125, -0.32239532470703125, -0.30413818359375, -0.28588104248046875, -0.2676239013671875, -0.24936676025390625, -0.231109619140625, -0.21285247802734375, -0.1945953369140625, -0.17633819580078125, -0.1580810546875, -0.13982391357421875, -0.1215667724609375, -0.10330963134765625, -0.085052490234375, -0.06679534912109375, -0.0485382080078125, -0.03028106689453125, -0.01202392578125, 0.00623321533203125, 0.0244903564453125, 0.04274749755859375, 0.061004638671875, 0.07926177978515625, 0.0975189208984375, 0.11577606201171875, 0.134033203125, 0.15229034423828125, 0.1705474853515625, 0.18880462646484375, 0.207061767578125, 0.22531890869140625, 0.2435760498046875, 0.26183319091796875, 0.28009033203125, 0.29834747314453125, 0.3166046142578125, 0.33486175537109375, 0.353118896484375, 0.37137603759765625, 0.3896331787109375, 0.40789031982421875, 0.4261474609375, 0.44440460205078125, 0.4626617431640625, 0.48091888427734375, 0.499176025390625, 0.5174331665039062, 0.5356903076171875, 0.5539474487304688, 0.57220458984375, 0.5904617309570312, 0.6087188720703125, 0.6269760131835938, 0.645233154296875, 0.6634902954101562, 0.6817474365234375, 0.7000045776367188, 0.71826171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 4.0, 7.0, 12.0, 13.0, 20.0, 25.0, 35.0, 50.0, 73.0, 111.0, 134.0, 140.0, 113.0, 78.0, 58.0, 46.0, 24.0, 22.0, 16.0, 3.0, 5.0, 4.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.032090187072754, -2.9403839111328125, -2.848677396774292, -2.7569708824157715, -2.66526460647583, -2.5735583305358887, -2.481851816177368, -2.3901453018188477, -2.2984390258789062, -2.206732749938965, -2.1150262355804443, -2.023319721221924, -1.9316134452819824, -1.8399070501327515, -1.7482006549835205, -1.6564942598342896, -1.5647878646850586, -1.4730814695358276, -1.3813750743865967, -1.2896686792373657, -1.1979622840881348, -1.1062558889389038, -1.0145494937896729, -0.9228430986404419, -0.8311367034912109, -0.73943030834198, -0.647723913192749, -0.5560175180435181, -0.4643111228942871, -0.37260472774505615, -0.2808983325958252, -0.18919193744659424, -0.09748530387878418, -0.005778908729553223, 0.08592748641967773, 0.1776338815689087, 0.26934027671813965, 0.3610466718673706, 0.45275306701660156, 0.5444594621658325, 0.6361658573150635, 0.7278722524642944, 0.8195786476135254, 0.9112850427627563, 1.0029914379119873, 1.0946978330612183, 1.1864042282104492, 1.2781106233596802, 1.3698170185089111, 1.461523413658142, 1.553229808807373, 1.644936203956604, 1.736642599105835, 1.828348994255066, 1.9200553894042969, 2.0117616653442383, 2.103468179702759, 2.1951746940612793, 2.2868809700012207, 2.378587245941162, 2.4702937602996826, 2.562000274658203, 2.6537065505981445, 2.745412826538086, 2.8371193408966064]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 4.0, 4.0, 14.0, 16.0, 22.0, 21.0, 30.0, 17.0, 32.0, 36.0, 58.0, 69.0, 64.0, 68.0, 74.0, 61.0, 55.0, 66.0, 42.0, 31.0, 38.0, 37.0, 23.0, 21.0, 21.0, 15.0, 8.0, 13.0, 7.0, 5.0, 7.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5928623676300049, -1.5402166843414307, -1.487571120262146, -1.4349255561828613, -1.382279872894287, -1.329634189605713, -1.2769886255264282, -1.2243430614471436, -1.1716973781585693, -1.1190516948699951, -1.0664061307907104, -1.0137605667114258, -0.9611148834228516, -0.9084692597389221, -0.8558236360549927, -0.8031780123710632, -0.7505323886871338, -0.6978867650032043, -0.6452411413192749, -0.5925955176353455, -0.539949893951416, -0.4873042702674866, -0.43465864658355713, -0.3820130228996277, -0.32936739921569824, -0.2767217755317688, -0.22407615184783936, -0.1714305281639099, -0.11878490447998047, -0.06613928079605103, -0.013493657112121582, 0.03915196657180786, 0.0917975902557373, 0.14444321393966675, 0.1970888376235962, 0.24973446130752563, 0.3023800849914551, 0.3550257086753845, 0.40767133235931396, 0.4603169560432434, 0.5129625797271729, 0.5656082034111023, 0.6182538270950317, 0.6708994507789612, 0.7235450744628906, 0.7761906981468201, 0.8288363218307495, 0.881481945514679, 0.9341275691986084, 0.9867731928825378, 1.0394188165664673, 1.092064380645752, 1.1447100639343262, 1.1973557472229004, 1.250001311302185, 1.3026468753814697, 1.355292558670044, 1.4079382419586182, 1.4605838060379028, 1.5132293701171875, 1.5658750534057617, 1.618520736694336, 1.6711663007736206, 1.7238118648529053, 1.7764575481414795]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 4.0, 3.0, 7.0, 11.0, 9.0, 11.0, 15.0, 20.0, 27.0, 28.0, 43.0, 76.0, 98.0, 136.0, 208.0, 284.0, 466.0, 797.0, 1557.0, 4106.0, 16967.0, 159247.0, 772805.0, 74705.0, 10614.0, 3060.0, 1274.0, 678.0, 417.0, 239.0, 180.0, 111.0, 90.0, 72.0, 35.0, 38.0, 28.0, 15.0, 10.0, 22.0, 5.0, 10.0, 4.0, 4.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.296630859375, -0.2874641418457031, -0.27829742431640625, -0.2691307067871094, -0.2599639892578125, -0.2507972717285156, -0.24163055419921875, -0.23246383666992188, -0.223297119140625, -0.21413040161132812, -0.20496368408203125, -0.19579696655273438, -0.1866302490234375, -0.17746353149414062, -0.16829681396484375, -0.15913009643554688, -0.14996337890625, -0.14079666137695312, -0.13162994384765625, -0.12246322631835938, -0.1132965087890625, -0.10412979125976562, -0.09496307373046875, -0.08579635620117188, -0.076629638671875, -0.06746292114257812, -0.05829620361328125, -0.049129486083984375, -0.0399627685546875, -0.030796051025390625, -0.02162933349609375, -0.012462615966796875, -0.0032958984375, 0.005870819091796875, 0.01503753662109375, 0.024204254150390625, 0.0333709716796875, 0.042537689208984375, 0.05170440673828125, 0.060871124267578125, 0.070037841796875, 0.07920455932617188, 0.08837127685546875, 0.09753799438476562, 0.1067047119140625, 0.11587142944335938, 0.12503814697265625, 0.13420486450195312, 0.14337158203125, 0.15253829956054688, 0.16170501708984375, 0.17087173461914062, 0.1800384521484375, 0.18920516967773438, 0.19837188720703125, 0.20753860473632812, 0.216705322265625, 0.22587203979492188, 0.23503875732421875, 0.24420547485351562, 0.2533721923828125, 0.2625389099121094, 0.27170562744140625, 0.2808723449707031, 0.2900390625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 8.0, 5.0, 13.0, 14.0, 21.0, 25.0, 17.0, 43.0, 37.0, 39.0, 52.0, 70.0, 75.0, 62.0, 90.0, 59.0, 52.0, 57.0, 50.0, 37.0, 32.0, 33.0, 17.0, 24.0, 11.0, 22.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.361328125, -1.3186798095703125, -1.276031494140625, -1.2333831787109375, -1.19073486328125, -1.1480865478515625, -1.105438232421875, -1.0627899169921875, -1.0201416015625, -0.9774932861328125, -0.934844970703125, -0.8921966552734375, -0.84954833984375, -0.8069000244140625, -0.764251708984375, -0.7216033935546875, -0.678955078125, -0.6363067626953125, -0.593658447265625, -0.5510101318359375, -0.50836181640625, -0.4657135009765625, -0.423065185546875, -0.3804168701171875, -0.3377685546875, -0.2951202392578125, -0.252471923828125, -0.2098236083984375, -0.16717529296875, -0.1245269775390625, -0.081878662109375, -0.0392303466796875, 0.00341796875, 0.0460662841796875, 0.088714599609375, 0.1313629150390625, 0.17401123046875, 0.2166595458984375, 0.259307861328125, 0.3019561767578125, 0.3446044921875, 0.3872528076171875, 0.429901123046875, 0.4725494384765625, 0.51519775390625, 0.5578460693359375, 0.600494384765625, 0.6431427001953125, 0.685791015625, 0.7284393310546875, 0.771087646484375, 0.8137359619140625, 0.85638427734375, 0.8990325927734375, 0.941680908203125, 0.9843292236328125, 1.0269775390625, 1.0696258544921875, 1.112274169921875, 1.1549224853515625, 1.19757080078125, 1.2402191162109375, 1.282867431640625, 1.3255157470703125, 1.3681640625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 9.0, 4.0, 2.0, 7.0, 10.0, 17.0, 15.0, 32.0, 36.0, 49.0, 58.0, 95.0, 116.0, 154.0, 177.0, 294.0, 478.0, 1114.0, 3987.0, 26658.0, 320669.0, 628391.0, 55795.0, 7109.0, 1481.0, 541.0, 362.0, 238.0, 167.0, 127.0, 90.0, 67.0, 47.0, 41.0, 21.0, 24.0, 16.0, 13.0, 13.0, 6.0, 8.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.199462890625, -0.19344711303710938, -0.18743133544921875, -0.18141555786132812, -0.1753997802734375, -0.16938400268554688, -0.16336822509765625, -0.15735244750976562, -0.151336669921875, -0.14532089233398438, -0.13930511474609375, -0.13328933715820312, -0.1272735595703125, -0.12125778198242188, -0.11524200439453125, -0.10922622680664062, -0.10321044921875, -0.09719467163085938, -0.09117889404296875, -0.08516311645507812, -0.0791473388671875, -0.07313156127929688, -0.06711578369140625, -0.061100006103515625, -0.055084228515625, -0.049068450927734375, -0.04305267333984375, -0.037036895751953125, -0.0310211181640625, -0.025005340576171875, -0.01898956298828125, -0.012973785400390625, -0.0069580078125, -0.000942230224609375, 0.00507354736328125, 0.011089324951171875, 0.0171051025390625, 0.023120880126953125, 0.02913665771484375, 0.035152435302734375, 0.041168212890625, 0.047183990478515625, 0.05319976806640625, 0.059215545654296875, 0.0652313232421875, 0.07124710083007812, 0.07726287841796875, 0.08327865600585938, 0.08929443359375, 0.09531021118164062, 0.10132598876953125, 0.10734176635742188, 0.1133575439453125, 0.11937332153320312, 0.12538909912109375, 0.13140487670898438, 0.137420654296875, 0.14343643188476562, 0.14945220947265625, 0.15546798706054688, 0.1614837646484375, 0.16749954223632812, 0.17351531982421875, 0.17953109741210938, 0.185546875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 1.0, 8.0, 4.0, 3.0, 6.0, 9.0, 13.0, 12.0, 8.0, 21.0, 21.0, 18.0, 27.0, 27.0, 36.0, 32.0, 48.0, 37.0, 51.0, 49.0, 64.0, 49.0, 52.0, 45.0, 41.0, 46.0, 40.0, 33.0, 35.0, 29.0, 21.0, 20.0, 16.0, 12.0, 12.0, 10.0, 14.0, 8.0, 8.0, 6.0, 5.0, 6.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.060546875, -1.998077392578125, -1.93560791015625, -1.873138427734375, -1.8106689453125, -1.748199462890625, -1.68572998046875, -1.623260498046875, -1.560791015625, -1.498321533203125, -1.43585205078125, -1.373382568359375, -1.3109130859375, -1.248443603515625, -1.18597412109375, -1.123504638671875, -1.06103515625, -0.998565673828125, -0.93609619140625, -0.873626708984375, -0.8111572265625, -0.748687744140625, -0.68621826171875, -0.623748779296875, -0.561279296875, -0.498809814453125, -0.43634033203125, -0.373870849609375, -0.3114013671875, -0.248931884765625, -0.18646240234375, -0.123992919921875, -0.0615234375, 0.000946044921875, 0.06341552734375, 0.125885009765625, 0.1883544921875, 0.250823974609375, 0.31329345703125, 0.375762939453125, 0.438232421875, 0.500701904296875, 0.56317138671875, 0.625640869140625, 0.6881103515625, 0.750579833984375, 0.81304931640625, 0.875518798828125, 0.93798828125, 1.000457763671875, 1.06292724609375, 1.125396728515625, 1.1878662109375, 1.250335693359375, 1.31280517578125, 1.375274658203125, 1.437744140625, 1.500213623046875, 1.56268310546875, 1.625152587890625, 1.6876220703125, 1.750091552734375, 1.81256103515625, 1.875030517578125, 1.9375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 8.0, 6.0, 7.0, 8.0, 5.0, 16.0, 26.0, 21.0, 34.0, 50.0, 57.0, 104.0, 144.0, 211.0, 293.0, 565.0, 1534.0, 8860.0, 327653.0, 692176.0, 13266.0, 1858.0, 638.0, 358.0, 189.0, 134.0, 91.0, 68.0, 52.0, 34.0, 24.0, 21.0, 12.0, 9.0, 10.0, 5.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.040191650390625, -0.03904581069946289, -0.03789997100830078, -0.03675413131713867, -0.03560829162597656, -0.03446245193481445, -0.033316612243652344, -0.032170772552490234, -0.031024932861328125, -0.029879093170166016, -0.028733253479003906, -0.027587413787841797, -0.026441574096679688, -0.025295734405517578, -0.02414989471435547, -0.02300405502319336, -0.02185821533203125, -0.02071237564086914, -0.01956653594970703, -0.018420696258544922, -0.017274856567382812, -0.016129016876220703, -0.014983177185058594, -0.013837337493896484, -0.012691497802734375, -0.011545658111572266, -0.010399818420410156, -0.009253978729248047, -0.008108139038085938, -0.006962299346923828, -0.005816459655761719, -0.004670619964599609, -0.0035247802734375, -0.0023789405822753906, -0.0012331008911132812, -8.726119995117188e-05, 0.0010585784912109375, 0.002204418182373047, 0.0033502578735351562, 0.004496097564697266, 0.005641937255859375, 0.006787776947021484, 0.007933616638183594, 0.009079456329345703, 0.010225296020507812, 0.011371135711669922, 0.012516975402832031, 0.01366281509399414, 0.01480865478515625, 0.01595449447631836, 0.01710033416748047, 0.018246173858642578, 0.019392013549804688, 0.020537853240966797, 0.021683692932128906, 0.022829532623291016, 0.023975372314453125, 0.025121212005615234, 0.026267051696777344, 0.027412891387939453, 0.028558731079101562, 0.029704570770263672, 0.03085041046142578, 0.03199625015258789, 0.03314208984375]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 5.0, 4.0, 6.0, 4.0, 6.0, 10.0, 22.0, 36.0, 54.0, 65.0, 88.0, 126.0, 123.0, 106.0, 113.0, 72.0, 55.0, 35.0, 22.0, 17.0, 11.0, 10.0, 6.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.895427703857422e-05, -1.8392689526081085e-05, -1.783110201358795e-05, -1.7269514501094818e-05, -1.6707926988601685e-05, -1.614633947610855e-05, -1.5584751963615417e-05, -1.5023164451122284e-05, -1.446157693862915e-05, -1.3899989426136017e-05, -1.3338401913642883e-05, -1.277681440114975e-05, -1.2215226888656616e-05, -1.1653639376163483e-05, -1.1092051863670349e-05, -1.0530464351177216e-05, -9.968876838684082e-06, -9.407289326190948e-06, -8.845701813697815e-06, -8.284114301204681e-06, -7.722526788711548e-06, -7.160939276218414e-06, -6.599351763725281e-06, -6.037764251232147e-06, -5.476176738739014e-06, -4.91458922624588e-06, -4.353001713752747e-06, -3.791414201259613e-06, -3.2298266887664795e-06, -2.668239176273346e-06, -2.1066516637802124e-06, -1.5450641512870789e-06, -9.834766387939453e-07, -4.2188912630081177e-07, 1.3969838619232178e-07, 7.012858986854553e-07, 1.2628734111785889e-06, 1.8244609236717224e-06, 2.386048436164856e-06, 2.9476359486579895e-06, 3.509223461151123e-06, 4.070810973644257e-06, 4.63239848613739e-06, 5.193985998630524e-06, 5.755573511123657e-06, 6.317161023616791e-06, 6.878748536109924e-06, 7.440336048603058e-06, 8.001923561096191e-06, 8.563511073589325e-06, 9.125098586082458e-06, 9.686686098575592e-06, 1.0248273611068726e-05, 1.0809861123561859e-05, 1.1371448636054993e-05, 1.1933036148548126e-05, 1.249462366104126e-05, 1.3056211173534393e-05, 1.3617798686027527e-05, 1.417938619852066e-05, 1.4740973711013794e-05, 1.5302561223506927e-05, 1.586414873600006e-05, 1.6425736248493195e-05, 1.6987323760986328e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 16.0, 6.0, 13.0, 28.0, 42.0, 68.0, 119.0, 174.0, 401.0, 722.0, 1783.0, 5335.0, 28212.0, 813208.0, 178992.0, 13520.0, 3413.0, 1305.0, 584.0, 264.0, 144.0, 77.0, 53.0, 27.0, 14.0, 14.0, 7.0, 7.0, 5.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06048583984375, -0.058696746826171875, -0.05690765380859375, -0.055118560791015625, -0.0533294677734375, -0.051540374755859375, -0.04975128173828125, -0.047962188720703125, -0.046173095703125, -0.044384002685546875, -0.04259490966796875, -0.040805816650390625, -0.0390167236328125, -0.037227630615234375, -0.03543853759765625, -0.033649444580078125, -0.0318603515625, -0.030071258544921875, -0.02828216552734375, -0.026493072509765625, -0.0247039794921875, -0.022914886474609375, -0.02112579345703125, -0.019336700439453125, -0.017547607421875, -0.015758514404296875, -0.01396942138671875, -0.012180328369140625, -0.0103912353515625, -0.008602142333984375, -0.00681304931640625, -0.005023956298828125, -0.00323486328125, -0.001445770263671875, 0.00034332275390625, 0.002132415771484375, 0.0039215087890625, 0.005710601806640625, 0.00749969482421875, 0.009288787841796875, 0.011077880859375, 0.012866973876953125, 0.01465606689453125, 0.016445159912109375, 0.0182342529296875, 0.020023345947265625, 0.02181243896484375, 0.023601531982421875, 0.025390625, 0.027179718017578125, 0.02896881103515625, 0.030757904052734375, 0.0325469970703125, 0.034336090087890625, 0.03612518310546875, 0.037914276123046875, 0.039703369140625, 0.041492462158203125, 0.04328155517578125, 0.045070648193359375, 0.0468597412109375, 0.048648834228515625, 0.05043792724609375, 0.052227020263671875, 0.05401611328125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 6.0, 1.0, 2.0, 4.0, 6.0, 5.0, 8.0, 9.0, 23.0, 39.0, 98.0, 237.0, 278.0, 123.0, 57.0, 25.0, 23.0, 21.0, 16.0, 7.0, 1.0, 4.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00982666015625, -0.009489297866821289, -0.009151935577392578, -0.008814573287963867, -0.008477210998535156, -0.008139848709106445, -0.007802486419677734, -0.0074651241302490234, -0.0071277618408203125, -0.0067903995513916016, -0.006453037261962891, -0.00611567497253418, -0.005778312683105469, -0.005440950393676758, -0.005103588104248047, -0.004766225814819336, -0.004428863525390625, -0.004091501235961914, -0.003754138946533203, -0.003416776657104492, -0.0030794143676757812, -0.0027420520782470703, -0.0024046897888183594, -0.0020673274993896484, -0.0017299652099609375, -0.0013926029205322266, -0.0010552406311035156, -0.0007178783416748047, -0.00038051605224609375, -4.315376281738281e-05, 0.0002942085266113281, 0.0006315708160400391, 0.00096893310546875, 0.001306295394897461, 0.0016436576843261719, 0.001981019973754883, 0.0023183822631835938, 0.0026557445526123047, 0.0029931068420410156, 0.0033304691314697266, 0.0036678314208984375, 0.0040051937103271484, 0.004342555999755859, 0.00467991828918457, 0.005017280578613281, 0.005354642868041992, 0.005692005157470703, 0.006029367446899414, 0.006366729736328125, 0.006704092025756836, 0.007041454315185547, 0.007378816604614258, 0.007716178894042969, 0.00805354118347168, 0.00839090347290039, 0.008728265762329102, 0.009065628051757812, 0.009402990341186523, 0.009740352630615234, 0.010077714920043945, 0.010415077209472656, 0.010752439498901367, 0.011089801788330078, 0.011427164077758789, 0.0117645263671875]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 5.0, 9.0, 12.0, 17.0, 18.0, 32.0, 46.0, 49.0, 75.0, 127.0, 145.0, 122.0, 108.0, 78.0, 47.0, 38.0, 21.0, 22.0, 8.0, 7.0, 2.0, 4.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.905573844909668, -1.8393712043762207, -1.7731685638427734, -1.7069660425186157, -1.6407634019851685, -1.5745607614517212, -1.5083582401275635, -1.4421555995941162, -1.375952959060669, -1.3097503185272217, -1.2435476779937744, -1.1773451566696167, -1.1111425161361694, -1.0449398756027222, -0.9787372946739197, -0.9125347137451172, -0.8463320732116699, -0.7801294326782227, -0.7139268517494202, -0.6477242708206177, -0.5815216302871704, -0.5153189897537231, -0.44911640882492065, -0.3829137980937958, -0.3167111873626709, -0.250508576631546, -0.18430596590042114, -0.11810335516929626, -0.05190074443817139, 0.014301866292953491, 0.08050447702407837, 0.14670708775520325, 0.21290946006774902, 0.2791120707988739, 0.3453146815299988, 0.41151729226112366, 0.47771990299224854, 0.5439225435256958, 0.6101251244544983, 0.6763277053833008, 0.742530345916748, 0.8087329864501953, 0.8749355673789978, 0.9411381483078003, 1.0073407888412476, 1.0735434293746948, 1.1397459506988525, 1.2059485912322998, 1.272151231765747, 1.3383538722991943, 1.4045565128326416, 1.4707590341567993, 1.5369616746902466, 1.6031643152236938, 1.6693668365478516, 1.7355694770812988, 1.801772117614746, 1.8679747581481934, 1.9341773986816406, 2.000380039215088, 2.066582679748535, 2.1327850818634033, 2.1989877223968506, 2.265190362930298, 2.331393003463745]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 7.0, 6.0, 12.0, 17.0, 20.0, 28.0, 33.0, 36.0, 42.0, 66.0, 82.0, 86.0, 88.0, 76.0, 77.0, 61.0, 49.0, 46.0, 43.0, 23.0, 21.0, 22.0, 13.0, 9.0, 7.0, 7.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.299004316329956, -1.2520140409469604, -1.2050237655639648, -1.1580333709716797, -1.111043095588684, -1.0640528202056885, -1.0170624256134033, -0.9700721502304077, -0.9230818748474121, -0.8760915994644165, -0.8291012644767761, -0.7821109294891357, -0.7351206541061401, -0.6881303787231445, -0.6411400437355042, -0.5941497087478638, -0.5471594333648682, -0.5001691579818726, -0.4531788229942322, -0.4061885178089142, -0.3591982126235962, -0.3122079074382782, -0.2652176022529602, -0.2182272970676422, -0.17123699188232422, -0.12424668669700623, -0.07725638151168823, -0.03026607632637024, 0.016724228858947754, 0.06371453404426575, 0.11070483922958374, 0.15769514441490173, 0.20468544960021973, 0.2516757547855377, 0.2986660599708557, 0.3456563651561737, 0.3926466703414917, 0.4396369755268097, 0.4866272807121277, 0.5336176156997681, 0.5806078910827637, 0.6275981664657593, 0.6745885014533997, 0.72157883644104, 0.7685691118240356, 0.8155593872070312, 0.8625497221946716, 0.909540057182312, 0.9565303325653076, 1.0035206079483032, 1.0505108833312988, 1.097501277923584, 1.1444915533065796, 1.1914818286895752, 1.2384722232818604, 1.285462498664856, 1.3324527740478516, 1.3794430494308472, 1.4264333248138428, 1.473423719406128, 1.5204139947891235, 1.5674042701721191, 1.6143946647644043, 1.6613849401474, 1.7083752155303955]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 1.0, 5.0, 15.0, 12.0, 30.0, 37.0, 48.0, 72.0, 164.0, 274.0, 411.0, 920.0, 1836.0, 4004.0, 10137.0, 28325.0, 97783.0, 581226.0, 237676.0, 55570.0, 17684.0, 6771.0, 2801.0, 1304.0, 654.0, 339.0, 171.0, 104.0, 74.0, 36.0, 22.0, 18.0, 10.0, 6.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.01171875, -0.978851318359375, -0.94598388671875, -0.913116455078125, -0.8802490234375, -0.847381591796875, -0.81451416015625, -0.781646728515625, -0.748779296875, -0.715911865234375, -0.68304443359375, -0.650177001953125, -0.6173095703125, -0.584442138671875, -0.55157470703125, -0.518707275390625, -0.48583984375, -0.452972412109375, -0.42010498046875, -0.387237548828125, -0.3543701171875, -0.321502685546875, -0.28863525390625, -0.255767822265625, -0.222900390625, -0.190032958984375, -0.15716552734375, -0.124298095703125, -0.0914306640625, -0.058563232421875, -0.02569580078125, 0.007171630859375, 0.0400390625, 0.072906494140625, 0.10577392578125, 0.138641357421875, 0.1715087890625, 0.204376220703125, 0.23724365234375, 0.270111083984375, 0.302978515625, 0.335845947265625, 0.36871337890625, 0.401580810546875, 0.4344482421875, 0.467315673828125, 0.50018310546875, 0.533050537109375, 0.56591796875, 0.598785400390625, 0.63165283203125, 0.664520263671875, 0.6973876953125, 0.730255126953125, 0.76312255859375, 0.795989990234375, 0.828857421875, 0.861724853515625, 0.89459228515625, 0.927459716796875, 0.9603271484375, 0.993194580078125, 1.02606201171875, 1.058929443359375, 1.091796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 5.0, 13.0, 23.0, 13.0, 20.0, 43.0, 28.0, 58.0, 63.0, 76.0, 71.0, 99.0, 82.0, 80.0, 67.0, 51.0, 44.0, 42.0, 31.0, 19.0, 19.0, 7.0, 8.0, 8.0, 7.0, 3.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.486328125, -3.38861083984375, -3.2908935546875, -3.19317626953125, -3.095458984375, -2.99774169921875, -2.9000244140625, -2.80230712890625, -2.70458984375, -2.60687255859375, -2.5091552734375, -2.41143798828125, -2.313720703125, -2.21600341796875, -2.1182861328125, -2.02056884765625, -1.9228515625, -1.82513427734375, -1.7274169921875, -1.62969970703125, -1.531982421875, -1.43426513671875, -1.3365478515625, -1.23883056640625, -1.14111328125, -1.04339599609375, -0.9456787109375, -0.84796142578125, -0.750244140625, -0.65252685546875, -0.5548095703125, -0.45709228515625, -0.359375, -0.26165771484375, -0.1639404296875, -0.06622314453125, 0.031494140625, 0.12921142578125, 0.2269287109375, 0.32464599609375, 0.42236328125, 0.52008056640625, 0.6177978515625, 0.71551513671875, 0.813232421875, 0.91094970703125, 1.0086669921875, 1.10638427734375, 1.2041015625, 1.30181884765625, 1.3995361328125, 1.49725341796875, 1.594970703125, 1.69268798828125, 1.7904052734375, 1.88812255859375, 1.98583984375, 2.08355712890625, 2.1812744140625, 2.27899169921875, 2.376708984375, 2.47442626953125, 2.5721435546875, 2.66986083984375, 2.767578125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 6.0, 11.0, 12.0, 9.0, 12.0, 8.0, 17.0, 22.0, 17.0, 28.0, 33.0, 44.0, 53.0, 76.0, 124.0, 190.0, 394.0, 2084.0, 32591.0, 936770.0, 71548.0, 3249.0, 540.0, 220.0, 127.0, 101.0, 46.0, 45.0, 25.0, 28.0, 24.0, 21.0, 20.0, 10.0, 13.0, 6.0, 4.0, 6.0, 9.0, 2.0, 1.0, 1.0, 4.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.884765625, -2.7802734375, -2.67578125, -2.5712890625, -2.466796875, -2.3623046875, -2.2578125, -2.1533203125, -2.048828125, -1.9443359375, -1.83984375, -1.7353515625, -1.630859375, -1.5263671875, -1.421875, -1.3173828125, -1.212890625, -1.1083984375, -1.00390625, -0.8994140625, -0.794921875, -0.6904296875, -0.5859375, -0.4814453125, -0.376953125, -0.2724609375, -0.16796875, -0.0634765625, 0.041015625, 0.1455078125, 0.25, 0.3544921875, 0.458984375, 0.5634765625, 0.66796875, 0.7724609375, 0.876953125, 0.9814453125, 1.0859375, 1.1904296875, 1.294921875, 1.3994140625, 1.50390625, 1.6083984375, 1.712890625, 1.8173828125, 1.921875, 2.0263671875, 2.130859375, 2.2353515625, 2.33984375, 2.4443359375, 2.548828125, 2.6533203125, 2.7578125, 2.8623046875, 2.966796875, 3.0712890625, 3.17578125, 3.2802734375, 3.384765625, 3.4892578125, 3.59375, 3.6982421875, 3.802734375]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 8.0, 6.0, 12.0, 13.0, 12.0, 7.0, 20.0, 19.0, 15.0, 32.0, 28.0, 39.0, 35.0, 39.0, 45.0, 53.0, 49.0, 40.0, 50.0, 44.0, 62.0, 40.0, 38.0, 41.0, 30.0, 33.0, 30.0, 25.0, 30.0, 16.0, 15.0, 15.0, 14.0, 8.0, 6.0, 11.0, 8.0, 4.0, 4.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.603515625, -2.52197265625, -2.4404296875, -2.35888671875, -2.27734375, -2.19580078125, -2.1142578125, -2.03271484375, -1.951171875, -1.86962890625, -1.7880859375, -1.70654296875, -1.625, -1.54345703125, -1.4619140625, -1.38037109375, -1.298828125, -1.21728515625, -1.1357421875, -1.05419921875, -0.97265625, -0.89111328125, -0.8095703125, -0.72802734375, -0.646484375, -0.56494140625, -0.4833984375, -0.40185546875, -0.3203125, -0.23876953125, -0.1572265625, -0.07568359375, 0.005859375, 0.08740234375, 0.1689453125, 0.25048828125, 0.33203125, 0.41357421875, 0.4951171875, 0.57666015625, 0.658203125, 0.73974609375, 0.8212890625, 0.90283203125, 0.984375, 1.06591796875, 1.1474609375, 1.22900390625, 1.310546875, 1.39208984375, 1.4736328125, 1.55517578125, 1.63671875, 1.71826171875, 1.7998046875, 1.88134765625, 1.962890625, 2.04443359375, 2.1259765625, 2.20751953125, 2.2890625, 2.37060546875, 2.4521484375, 2.53369140625, 2.615234375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 5.0, 1.0, 4.0, 5.0, 11.0, 9.0, 13.0, 15.0, 20.0, 33.0, 43.0, 47.0, 70.0, 98.0, 208.0, 455.0, 1004.0, 2928.0, 10157.0, 54062.0, 677547.0, 259803.0, 31323.0, 6926.0, 2090.0, 768.0, 347.0, 201.0, 98.0, 54.0, 35.0, 42.0, 32.0, 22.0, 17.0, 21.0, 12.0, 9.0, 4.0, 8.0, 6.0, 5.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64453125, -0.624298095703125, -0.60406494140625, -0.583831787109375, -0.5635986328125, -0.543365478515625, -0.52313232421875, -0.502899169921875, -0.482666015625, -0.462432861328125, -0.44219970703125, -0.421966552734375, -0.4017333984375, -0.381500244140625, -0.36126708984375, -0.341033935546875, -0.32080078125, -0.300567626953125, -0.28033447265625, -0.260101318359375, -0.2398681640625, -0.219635009765625, -0.19940185546875, -0.179168701171875, -0.158935546875, -0.138702392578125, -0.11846923828125, -0.098236083984375, -0.0780029296875, -0.057769775390625, -0.03753662109375, -0.017303466796875, 0.0029296875, 0.023162841796875, 0.04339599609375, 0.063629150390625, 0.0838623046875, 0.104095458984375, 0.12432861328125, 0.144561767578125, 0.164794921875, 0.185028076171875, 0.20526123046875, 0.225494384765625, 0.2457275390625, 0.265960693359375, 0.28619384765625, 0.306427001953125, 0.32666015625, 0.346893310546875, 0.36712646484375, 0.387359619140625, 0.4075927734375, 0.427825927734375, 0.44805908203125, 0.468292236328125, 0.488525390625, 0.508758544921875, 0.52899169921875, 0.549224853515625, 0.5694580078125, 0.589691162109375, 0.60992431640625, 0.630157470703125, 0.650390625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 8.0, 9.0, 9.0, 14.0, 17.0, 24.0, 33.0, 57.0, 55.0, 117.0, 246.0, 138.0, 64.0, 55.0, 44.0, 26.0, 18.0, 20.0, 12.0, 14.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.0001291036605834961, -0.00012614484876394272, -0.00012318603694438934, -0.00012022722512483597, -0.00011726841330528259, -0.00011430960148572922, -0.00011135078966617584, -0.00010839197784662247, -0.00010543316602706909, -0.00010247435420751572, -9.951554238796234e-05, -9.655673056840897e-05, -9.359791874885559e-05, -9.063910692930222e-05, -8.768029510974884e-05, -8.472148329019547e-05, -8.176267147064209e-05, -7.880385965108871e-05, -7.584504783153534e-05, -7.288623601198196e-05, -6.992742419242859e-05, -6.696861237287521e-05, -6.400980055332184e-05, -6.105098873376846e-05, -5.809217691421509e-05, -5.513336509466171e-05, -5.217455327510834e-05, -4.921574145555496e-05, -4.625692963600159e-05, -4.329811781644821e-05, -4.0339305996894836e-05, -3.738049417734146e-05, -3.4421682357788086e-05, -3.146287053823471e-05, -2.8504058718681335e-05, -2.554524689912796e-05, -2.2586435079574585e-05, -1.962762326002121e-05, -1.6668811440467834e-05, -1.370999962091446e-05, -1.0751187801361084e-05, -7.792375981807709e-06, -4.8335641622543335e-06, -1.8747523427009583e-06, 1.084059476852417e-06, 4.042871296405792e-06, 7.0016831159591675e-06, 9.960494935512543e-06, 1.2919306755065918e-05, 1.5878118574619293e-05, 1.883693039417267e-05, 2.1795742213726044e-05, 2.475455403327942e-05, 2.7713365852832794e-05, 3.067217767238617e-05, 3.3630989491939545e-05, 3.658980131149292e-05, 3.9548613131046295e-05, 4.250742495059967e-05, 4.5466236770153046e-05, 4.842504858970642e-05, 5.1383860409259796e-05, 5.434267222881317e-05, 5.730148404836655e-05, 6.026029586791992e-05]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 8.0, 14.0, 21.0, 23.0, 43.0, 73.0, 109.0, 237.0, 493.0, 1135.0, 3338.0, 12317.0, 60172.0, 662384.0, 259340.0, 36602.0, 8065.0, 2438.0, 912.0, 369.0, 185.0, 105.0, 64.0, 36.0, 17.0, 14.0, 11.0, 10.0, 10.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56298828125, -0.5427780151367188, -0.5225677490234375, -0.5023574829101562, -0.482147216796875, -0.46193695068359375, -0.4417266845703125, -0.42151641845703125, -0.40130615234375, -0.38109588623046875, -0.3608856201171875, -0.34067535400390625, -0.320465087890625, -0.30025482177734375, -0.2800445556640625, -0.25983428955078125, -0.2396240234375, -0.21941375732421875, -0.1992034912109375, -0.17899322509765625, -0.158782958984375, -0.13857269287109375, -0.1183624267578125, -0.09815216064453125, -0.07794189453125, -0.05773162841796875, -0.0375213623046875, -0.01731109619140625, 0.002899169921875, 0.02310943603515625, 0.0433197021484375, 0.06352996826171875, 0.083740234375, 0.10395050048828125, 0.1241607666015625, 0.14437103271484375, 0.164581298828125, 0.18479156494140625, 0.2050018310546875, 0.22521209716796875, 0.24542236328125, 0.26563262939453125, 0.2858428955078125, 0.30605316162109375, 0.326263427734375, 0.34647369384765625, 0.3666839599609375, 0.38689422607421875, 0.4071044921875, 0.42731475830078125, 0.4475250244140625, 0.46773529052734375, 0.487945556640625, 0.5081558227539062, 0.5283660888671875, 0.5485763549804688, 0.56878662109375, 0.5889968872070312, 0.6092071533203125, 0.6294174194335938, 0.649627685546875, 0.6698379516601562, 0.6900482177734375, 0.7102584838867188, 0.73046875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 10.0, 9.0, 9.0, 5.0, 16.0, 31.0, 30.0, 45.0, 63.0, 99.0, 251.0, 165.0, 78.0, 47.0, 35.0, 18.0, 17.0, 15.0, 11.0, 7.0, 8.0, 3.0, 5.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3369140625, -0.3282184600830078, -0.3195228576660156, -0.31082725524902344, -0.30213165283203125, -0.29343605041503906, -0.2847404479980469, -0.2760448455810547, -0.2673492431640625, -0.2586536407470703, -0.24995803833007812, -0.24126243591308594, -0.23256683349609375, -0.22387123107910156, -0.21517562866210938, -0.2064800262451172, -0.197784423828125, -0.1890888214111328, -0.18039321899414062, -0.17169761657714844, -0.16300201416015625, -0.15430641174316406, -0.14561080932617188, -0.1369152069091797, -0.1282196044921875, -0.11952400207519531, -0.11082839965820312, -0.10213279724121094, -0.09343719482421875, -0.08474159240722656, -0.07604598999023438, -0.06735038757324219, -0.05865478515625, -0.04995918273925781, -0.041263580322265625, -0.03256797790527344, -0.02387237548828125, -0.015176773071289062, -0.006481170654296875, 0.0022144317626953125, 0.0109100341796875, 0.019605636596679688, 0.028301239013671875, 0.03699684143066406, 0.04569244384765625, 0.05438804626464844, 0.06308364868164062, 0.07177925109863281, 0.080474853515625, 0.08917045593261719, 0.09786605834960938, 0.10656166076660156, 0.11525726318359375, 0.12395286560058594, 0.13264846801757812, 0.1413440704345703, 0.1500396728515625, 0.1587352752685547, 0.16743087768554688, 0.17612648010253906, 0.18482208251953125, 0.19351768493652344, 0.20221328735351562, 0.2109088897705078, 0.2196044921875]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 9.0, 20.0, 105.0, 370.0, 398.0, 87.0, 18.0, 4.0, 4.0, 0.0, 1.0], "bins": [-30.861248016357422, -30.31949234008789, -29.77773666381836, -29.235980987548828, -28.694225311279297, -28.152469635009766, -27.610713958740234, -27.068958282470703, -26.527202606201172, -25.98544692993164, -25.44369125366211, -24.901935577392578, -24.360179901123047, -23.818424224853516, -23.276668548583984, -22.734912872314453, -22.193157196044922, -21.65140151977539, -21.10964584350586, -20.567890167236328, -20.026134490966797, -19.484378814697266, -18.942623138427734, -18.400867462158203, -17.859113693237305, -17.317358016967773, -16.775602340698242, -16.23384666442871, -15.69209098815918, -15.150335311889648, -14.608579635620117, -14.066823959350586, -13.525069236755371, -12.98331356048584, -12.441557884216309, -11.899802207946777, -11.358046531677246, -10.816290855407715, -10.2745361328125, -9.732780456542969, -9.191023826599121, -8.64926815032959, -8.107512474060059, -7.565756797790527, -7.024001121520996, -6.482245445251465, -5.940490245819092, -5.3987345695495605, -4.8569793701171875, -4.315223693847656, -3.773468017578125, -3.231712579727173, -2.6899569034576416, -2.1482012271881104, -1.6064457893371582, -1.064690113067627, -0.5229341983795166, 0.018821418285369873, 0.5605770349502563, 1.102332592010498, 1.6440882682800293, 2.1858439445495605, 2.7275993824005127, 3.269355058670044, 3.811110734939575]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 6.0, 3.0, 2.0, 1.0, 4.0, 9.0, 9.0, 10.0, 10.0, 19.0, 18.0, 15.0, 15.0, 28.0, 30.0, 26.0, 40.0, 38.0, 37.0, 39.0, 30.0, 60.0, 48.0, 36.0, 47.0, 41.0, 38.0, 40.0, 34.0, 32.0, 33.0, 24.0, 26.0, 25.0, 21.0, 22.0, 13.0, 21.0, 9.0, 16.0, 7.0, 5.0, 3.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.071616172790527, -3.9486749172210693, -3.8257334232330322, -3.702792167663574, -3.579850912094116, -3.456909656524658, -3.333968162536621, -3.211026906967163, -3.088085651397705, -2.965144395828247, -2.84220290184021, -2.719261646270752, -2.596320390701294, -2.473379135131836, -2.350437641143799, -2.227496385574341, -2.1045548915863037, -1.9816135168075562, -1.8586722612380981, -1.7357308864593506, -1.6127896308898926, -1.489848256111145, -1.3669068813323975, -1.2439656257629395, -1.121024250984192, -0.9980829358100891, -0.8751416206359863, -0.7522002458572388, -0.629258930683136, -0.5063176155090332, -0.38337624073028564, -0.26043492555618286, -0.13749337196350098, -0.014552041888237, 0.10838928818702698, 0.23133063316345215, 0.35427194833755493, 0.4772132635116577, 0.6001546382904053, 0.7230959534645081, 0.8460372686386108, 0.9689785838127136, 1.0919198989868164, 1.214861273765564, 1.3378026485443115, 1.4607439041137695, 1.583685278892517, 1.7066266536712646, 1.8295679092407227, 1.9525092840194702, 2.0754506587982178, 2.198391914367676, 2.321333169937134, 2.444274425506592, 2.567215919494629, 2.690157175064087, 2.813098430633545, 2.936039686203003, 3.05898118019104, 3.181922435760498, 3.304863691329956, 3.427804946899414, 3.550746440887451, 3.673687696456909, 3.7966291904449463]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 2.0, 3.0, 3.0, 3.0, 8.0, 13.0, 12.0, 19.0, 21.0, 38.0, 36.0, 46.0, 93.0, 117.0, 171.0, 273.0, 378.0, 612.0, 882.0, 1624.0, 2935.0, 5987.0, 14510.0, 42651.0, 189182.0, 2183886.0, 1534288.0, 153611.0, 37499.0, 13002.0, 5537.0, 2725.0, 1497.0, 888.0, 519.0, 377.0, 256.0, 138.0, 125.0, 77.0, 70.0, 35.0, 32.0, 26.0, 16.0, 18.0, 10.0, 8.0, 8.0, 4.0, 3.0, 3.0, 1.0, 6.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.70703125, -1.6535797119140625, -1.600128173828125, -1.5466766357421875, -1.49322509765625, -1.4397735595703125, -1.386322021484375, -1.3328704833984375, -1.2794189453125, -1.2259674072265625, -1.172515869140625, -1.1190643310546875, -1.06561279296875, -1.0121612548828125, -0.958709716796875, -0.9052581787109375, -0.851806640625, -0.7983551025390625, -0.744903564453125, -0.6914520263671875, -0.63800048828125, -0.5845489501953125, -0.531097412109375, -0.4776458740234375, -0.4241943359375, -0.3707427978515625, -0.317291259765625, -0.2638397216796875, -0.21038818359375, -0.1569366455078125, -0.103485107421875, -0.0500335693359375, 0.00341796875, 0.0568695068359375, 0.110321044921875, 0.1637725830078125, 0.21722412109375, 0.2706756591796875, 0.324127197265625, 0.3775787353515625, 0.4310302734375, 0.4844818115234375, 0.537933349609375, 0.5913848876953125, 0.64483642578125, 0.6982879638671875, 0.751739501953125, 0.8051910400390625, 0.858642578125, 0.9120941162109375, 0.965545654296875, 1.0189971923828125, 1.07244873046875, 1.1259002685546875, 1.179351806640625, 1.2328033447265625, 1.2862548828125, 1.3397064208984375, 1.393157958984375, 1.4466094970703125, 1.50006103515625, 1.5535125732421875, 1.606964111328125, 1.6604156494140625, 1.7138671875]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 11.0, 6.0, 10.0, 21.0, 24.0, 27.0, 40.0, 57.0, 55.0, 68.0, 82.0, 96.0, 78.0, 73.0, 69.0, 58.0, 49.0, 41.0, 25.0, 25.0, 9.0, 21.0, 12.0, 3.0, 8.0, 9.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.470703125, -1.426055908203125, -1.38140869140625, -1.336761474609375, -1.2921142578125, -1.247467041015625, -1.20281982421875, -1.158172607421875, -1.113525390625, -1.068878173828125, -1.02423095703125, -0.979583740234375, -0.9349365234375, -0.890289306640625, -0.84564208984375, -0.800994873046875, -0.75634765625, -0.711700439453125, -0.66705322265625, -0.622406005859375, -0.5777587890625, -0.533111572265625, -0.48846435546875, -0.443817138671875, -0.399169921875, -0.354522705078125, -0.30987548828125, -0.265228271484375, -0.2205810546875, -0.175933837890625, -0.13128662109375, -0.086639404296875, -0.0419921875, 0.002655029296875, 0.04730224609375, 0.091949462890625, 0.1365966796875, 0.181243896484375, 0.22589111328125, 0.270538330078125, 0.315185546875, 0.359832763671875, 0.40447998046875, 0.449127197265625, 0.4937744140625, 0.538421630859375, 0.58306884765625, 0.627716064453125, 0.67236328125, 0.717010498046875, 0.76165771484375, 0.806304931640625, 0.8509521484375, 0.895599365234375, 0.94024658203125, 0.984893798828125, 1.029541015625, 1.074188232421875, 1.11883544921875, 1.163482666015625, 1.2081298828125, 1.252777099609375, 1.29742431640625, 1.342071533203125, 1.38671875]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 0.0, 5.0, 2.0, 4.0, 7.0, 2.0, 7.0, 9.0, 15.0, 21.0, 26.0, 46.0, 73.0, 78.0, 130.0, 211.0, 484.0, 1194.0, 3690.0, 17262.0, 136666.0, 3108200.0, 856963.0, 56150.0, 9080.0, 2199.0, 810.0, 365.0, 200.0, 112.0, 61.0, 57.0, 47.0, 29.0, 20.0, 20.0, 13.0, 6.0, 4.0, 4.0, 5.0, 6.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-3.513671875, -3.4127197265625, -3.311767578125, -3.2108154296875, -3.10986328125, -3.0089111328125, -2.907958984375, -2.8070068359375, -2.7060546875, -2.6051025390625, -2.504150390625, -2.4031982421875, -2.30224609375, -2.2012939453125, -2.100341796875, -1.9993896484375, -1.8984375, -1.7974853515625, -1.696533203125, -1.5955810546875, -1.49462890625, -1.3936767578125, -1.292724609375, -1.1917724609375, -1.0908203125, -0.9898681640625, -0.888916015625, -0.7879638671875, -0.68701171875, -0.5860595703125, -0.485107421875, -0.3841552734375, -0.283203125, -0.1822509765625, -0.081298828125, 0.0196533203125, 0.12060546875, 0.2215576171875, 0.322509765625, 0.4234619140625, 0.5244140625, 0.6253662109375, 0.726318359375, 0.8272705078125, 0.92822265625, 1.0291748046875, 1.130126953125, 1.2310791015625, 1.33203125, 1.4329833984375, 1.533935546875, 1.6348876953125, 1.73583984375, 1.8367919921875, 1.937744140625, 2.0386962890625, 2.1396484375, 2.2406005859375, 2.341552734375, 2.4425048828125, 2.54345703125, 2.6444091796875, 2.745361328125, 2.8463134765625, 2.947265625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 9.0, 11.0, 13.0, 10.0, 17.0, 25.0, 27.0, 40.0, 60.0, 82.0, 141.0, 224.0, 240.0, 465.0, 726.0, 682.0, 438.0, 245.0, 187.0, 125.0, 98.0, 63.0, 52.0, 23.0, 21.0, 18.0, 13.0, 9.0, 5.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55712890625, -0.5338897705078125, -0.510650634765625, -0.4874114990234375, -0.46417236328125, -0.4409332275390625, -0.417694091796875, -0.3944549560546875, -0.3712158203125, -0.3479766845703125, -0.324737548828125, -0.3014984130859375, -0.27825927734375, -0.2550201416015625, -0.231781005859375, -0.2085418701171875, -0.185302734375, -0.1620635986328125, -0.138824462890625, -0.1155853271484375, -0.09234619140625, -0.0691070556640625, -0.045867919921875, -0.0226287841796875, 0.0006103515625, 0.0238494873046875, 0.047088623046875, 0.0703277587890625, 0.09356689453125, 0.1168060302734375, 0.140045166015625, 0.1632843017578125, 0.1865234375, 0.2097625732421875, 0.233001708984375, 0.2562408447265625, 0.27947998046875, 0.3027191162109375, 0.325958251953125, 0.3491973876953125, 0.3724365234375, 0.3956756591796875, 0.418914794921875, 0.4421539306640625, 0.46539306640625, 0.4886322021484375, 0.511871337890625, 0.5351104736328125, 0.558349609375, 0.5815887451171875, 0.604827880859375, 0.6280670166015625, 0.65130615234375, 0.6745452880859375, 0.697784423828125, 0.7210235595703125, 0.7442626953125, 0.7675018310546875, 0.790740966796875, 0.8139801025390625, 0.83721923828125, 0.8604583740234375, 0.883697509765625, 0.9069366455078125, 0.93017578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 5.0, 4.0, 9.0, 24.0, 22.0, 29.0, 46.0, 68.0, 103.0, 97.0, 111.0, 118.0, 87.0, 74.0, 59.0, 39.0, 39.0, 23.0, 24.0, 13.0, 8.0, 1.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.699397325515747, -3.606414556503296, -3.513432025909424, -3.4204492568969727, -3.3274667263031006, -3.2344839572906494, -3.1415014266967773, -3.048518657684326, -2.955535888671875, -2.862553119659424, -2.7695705890655518, -2.6765878200531006, -2.5836052894592285, -2.4906225204467773, -2.397639751434326, -2.304657220840454, -2.211674690246582, -2.118691921234131, -2.025709390640259, -1.9327266216278076, -1.8397440910339355, -1.7467613220214844, -1.6537786722183228, -1.5607960224151611, -1.4678133726119995, -1.374830722808838, -1.2818480730056763, -1.1888654232025146, -1.0958826541900635, -1.0029001235961914, -0.9099173545837402, -0.8169347047805786, -0.7239522933959961, -0.6309696435928345, -0.5379869937896729, -0.44500428438186646, -0.35202163457870483, -0.2590389847755432, -0.16605627536773682, -0.0730736255645752, 0.019909024238586426, 0.11289168894290924, 0.20587435364723206, 0.29885703325271606, 0.3918396830558777, 0.4848223328590393, 0.5778050422668457, 0.6707876920700073, 0.763770341873169, 0.8567529916763306, 0.9497356414794922, 1.0427184104919434, 1.1357009410858154, 1.2286837100982666, 1.3216663599014282, 1.4146490097045898, 1.5076316595077515, 1.600614309310913, 1.6935969591140747, 1.7865796089172363, 1.8795623779296875, 1.9725449085235596, 2.0655276775360107, 2.158510208129883, 2.251492977142334]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 4.0, 5.0, 4.0, 4.0, 6.0, 8.0, 16.0, 10.0, 14.0, 15.0, 32.0, 19.0, 21.0, 34.0, 31.0, 43.0, 47.0, 44.0, 46.0, 50.0, 53.0, 43.0, 32.0, 44.0, 36.0, 39.0, 39.0, 34.0, 35.0, 35.0, 21.0, 26.0, 33.0, 15.0, 15.0, 13.0, 10.0, 9.0, 6.0, 7.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4027278423309326, -1.353599190711975, -1.3044705390930176, -1.2553417682647705, -1.206213116645813, -1.1570844650268555, -1.107955813407898, -1.0588271617889404, -1.009698510169983, -0.9605698585510254, -0.9114411473274231, -0.8623124957084656, -0.8131838440895081, -0.7640551328659058, -0.7149264812469482, -0.6657978296279907, -0.6166691184043884, -0.5675404667854309, -0.5184117555618286, -0.4692831039428711, -0.4201544523239136, -0.37102577090263367, -0.32189708948135376, -0.27276843786239624, -0.22363975644111633, -0.17451108992099762, -0.1253824234008789, -0.076253741979599, -0.027125075459480286, 0.022003591060638428, 0.07113227248191833, 0.12026092410087585, 0.16938960552215576, 0.21851827204227448, 0.2676469385623932, 0.3167756199836731, 0.3659042716026306, 0.4150329530239105, 0.46416163444519043, 0.513290286064148, 0.5624189376831055, 0.611547589302063, 0.6606763005256653, 0.7098049521446228, 0.7589336037635803, 0.8080623149871826, 0.8571909666061401, 0.9063196182250977, 0.9554483294487, 1.0045770406723022, 1.0537056922912598, 1.1028343439102173, 1.1519629955291748, 1.2010916471481323, 1.2502202987670898, 1.299349069595337, 1.3484777212142944, 1.397606372833252, 1.4467350244522095, 1.495863676071167, 1.544992446899414, 1.5941210985183716, 1.643249750137329, 1.6923784017562866, 1.7415070533752441]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 8.0, 3.0, 6.0, 9.0, 11.0, 16.0, 21.0, 36.0, 41.0, 65.0, 79.0, 159.0, 236.0, 504.0, 1245.0, 3865.0, 16066.0, 126295.0, 771487.0, 108050.0, 14493.0, 3456.0, 1221.0, 490.0, 241.0, 144.0, 95.0, 49.0, 39.0, 40.0, 17.0, 17.0, 15.0, 15.0, 5.0, 11.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.287353515625, -0.27725982666015625, -0.2671661376953125, -0.25707244873046875, -0.246978759765625, -0.23688507080078125, -0.2267913818359375, -0.21669769287109375, -0.20660400390625, -0.19651031494140625, -0.1864166259765625, -0.17632293701171875, -0.166229248046875, -0.15613555908203125, -0.1460418701171875, -0.13594818115234375, -0.1258544921875, -0.11576080322265625, -0.1056671142578125, -0.09557342529296875, -0.085479736328125, -0.07538604736328125, -0.0652923583984375, -0.05519866943359375, -0.04510498046875, -0.03501129150390625, -0.0249176025390625, -0.01482391357421875, -0.004730224609375, 0.00536346435546875, 0.0154571533203125, 0.02555084228515625, 0.03564453125, 0.04573822021484375, 0.0558319091796875, 0.06592559814453125, 0.076019287109375, 0.08611297607421875, 0.0962066650390625, 0.10630035400390625, 0.11639404296875, 0.12648773193359375, 0.1365814208984375, 0.14667510986328125, 0.156768798828125, 0.16686248779296875, 0.1769561767578125, 0.18704986572265625, 0.1971435546875, 0.20723724365234375, 0.2173309326171875, 0.22742462158203125, 0.237518310546875, 0.24761199951171875, 0.2577056884765625, 0.26779937744140625, 0.27789306640625, 0.28798675537109375, 0.2980804443359375, 0.30817413330078125, 0.318267822265625, 0.32836151123046875, 0.3384552001953125, 0.34854888916015625, 0.358642578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 4.0, 5.0, 14.0, 9.0, 9.0, 18.0, 22.0, 31.0, 28.0, 32.0, 36.0, 38.0, 51.0, 62.0, 60.0, 50.0, 51.0, 39.0, 57.0, 53.0, 45.0, 39.0, 41.0, 37.0, 35.0, 26.0, 22.0, 19.0, 16.0, 11.0, 6.0, 12.0, 4.0, 8.0, 6.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0556640625, -1.018829345703125, -0.98199462890625, -0.945159912109375, -0.9083251953125, -0.871490478515625, -0.83465576171875, -0.797821044921875, -0.760986328125, -0.724151611328125, -0.68731689453125, -0.650482177734375, -0.6136474609375, -0.576812744140625, -0.53997802734375, -0.503143310546875, -0.46630859375, -0.429473876953125, -0.39263916015625, -0.355804443359375, -0.3189697265625, -0.282135009765625, -0.24530029296875, -0.208465576171875, -0.171630859375, -0.134796142578125, -0.09796142578125, -0.061126708984375, -0.0242919921875, 0.012542724609375, 0.04937744140625, 0.086212158203125, 0.123046875, 0.159881591796875, 0.19671630859375, 0.233551025390625, 0.2703857421875, 0.307220458984375, 0.34405517578125, 0.380889892578125, 0.417724609375, 0.454559326171875, 0.49139404296875, 0.528228759765625, 0.5650634765625, 0.601898193359375, 0.63873291015625, 0.675567626953125, 0.71240234375, 0.749237060546875, 0.78607177734375, 0.822906494140625, 0.8597412109375, 0.896575927734375, 0.93341064453125, 0.970245361328125, 1.007080078125, 1.043914794921875, 1.08074951171875, 1.117584228515625, 1.1544189453125, 1.191253662109375, 1.22808837890625, 1.264923095703125, 1.3017578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 5.0, 4.0, 7.0, 8.0, 14.0, 8.0, 20.0, 22.0, 27.0, 36.0, 45.0, 73.0, 82.0, 101.0, 126.0, 200.0, 242.0, 350.0, 705.0, 2329.0, 13126.0, 150145.0, 789132.0, 79586.0, 8490.0, 1829.0, 658.0, 292.0, 226.0, 163.0, 120.0, 111.0, 71.0, 46.0, 32.0, 19.0, 31.0, 21.0, 11.0, 11.0, 7.0, 8.0, 7.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2237548828125, -0.21639060974121094, -0.20902633666992188, -0.2016620635986328, -0.19429779052734375, -0.1869335174560547, -0.17956924438476562, -0.17220497131347656, -0.1648406982421875, -0.15747642517089844, -0.15011215209960938, -0.1427478790283203, -0.13538360595703125, -0.1280193328857422, -0.12065505981445312, -0.11329078674316406, -0.105926513671875, -0.09856224060058594, -0.09119796752929688, -0.08383369445800781, -0.07646942138671875, -0.06910514831542969, -0.061740875244140625, -0.05437660217285156, -0.0470123291015625, -0.03964805603027344, -0.032283782958984375, -0.024919509887695312, -0.01755523681640625, -0.010190963745117188, -0.002826690673828125, 0.0045375823974609375, 0.01190185546875, 0.019266128540039062, 0.026630401611328125, 0.03399467468261719, 0.04135894775390625, 0.04872322082519531, 0.056087493896484375, 0.06345176696777344, 0.0708160400390625, 0.07818031311035156, 0.08554458618164062, 0.09290885925292969, 0.10027313232421875, 0.10763740539550781, 0.11500167846679688, 0.12236595153808594, 0.129730224609375, 0.13709449768066406, 0.14445877075195312, 0.1518230438232422, 0.15918731689453125, 0.1665515899658203, 0.17391586303710938, 0.18128013610839844, 0.1886444091796875, 0.19600868225097656, 0.20337295532226562, 0.2107372283935547, 0.21810150146484375, 0.2254657745361328, 0.23283004760742188, 0.24019432067871094, 0.24755859375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 6.0, 6.0, 1.0, 3.0, 3.0, 11.0, 7.0, 11.0, 18.0, 21.0, 27.0, 18.0, 29.0, 35.0, 35.0, 34.0, 37.0, 50.0, 43.0, 55.0, 50.0, 40.0, 62.0, 40.0, 42.0, 42.0, 41.0, 33.0, 36.0, 27.0, 26.0, 20.0, 16.0, 16.0, 13.0, 7.0, 2.0, 8.0, 12.0, 8.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.9345703125, -1.8699798583984375, -1.805389404296875, -1.7407989501953125, -1.67620849609375, -1.6116180419921875, -1.547027587890625, -1.4824371337890625, -1.4178466796875, -1.3532562255859375, -1.288665771484375, -1.2240753173828125, -1.15948486328125, -1.0948944091796875, -1.030303955078125, -0.9657135009765625, -0.901123046875, -0.8365325927734375, -0.771942138671875, -0.7073516845703125, -0.64276123046875, -0.5781707763671875, -0.513580322265625, -0.4489898681640625, -0.3843994140625, -0.3198089599609375, -0.255218505859375, -0.1906280517578125, -0.12603759765625, -0.0614471435546875, 0.003143310546875, 0.0677337646484375, 0.13232421875, 0.1969146728515625, 0.261505126953125, 0.3260955810546875, 0.39068603515625, 0.4552764892578125, 0.519866943359375, 0.5844573974609375, 0.6490478515625, 0.7136383056640625, 0.778228759765625, 0.8428192138671875, 0.90740966796875, 0.9720001220703125, 1.036590576171875, 1.1011810302734375, 1.165771484375, 1.2303619384765625, 1.294952392578125, 1.3595428466796875, 1.42413330078125, 1.4887237548828125, 1.553314208984375, 1.6179046630859375, 1.6824951171875, 1.7470855712890625, 1.811676025390625, 1.8762664794921875, 1.94085693359375, 2.0054473876953125, 2.070037841796875, 2.1346282958984375, 2.19921875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 9.0, 14.0, 19.0, 31.0, 41.0, 62.0, 89.0, 76.0, 137.0, 207.0, 333.0, 762.0, 3655.0, 61991.0, 952439.0, 24976.0, 2215.0, 562.0, 301.0, 162.0, 114.0, 87.0, 64.0, 51.0, 34.0, 29.0, 17.0, 10.0, 14.0, 9.0, 6.0, 3.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057708740234375, -0.055869102478027344, -0.05402946472167969, -0.05218982696533203, -0.050350189208984375, -0.04851055145263672, -0.04667091369628906, -0.044831275939941406, -0.04299163818359375, -0.041152000427246094, -0.03931236267089844, -0.03747272491455078, -0.035633087158203125, -0.03379344940185547, -0.03195381164550781, -0.030114173889160156, -0.0282745361328125, -0.026434898376464844, -0.024595260620117188, -0.02275562286376953, -0.020915985107421875, -0.01907634735107422, -0.017236709594726562, -0.015397071838378906, -0.01355743408203125, -0.011717796325683594, -0.009878158569335938, -0.008038520812988281, -0.006198883056640625, -0.004359245300292969, -0.0025196075439453125, -0.0006799697875976562, 0.00115966796875, 0.0029993057250976562, 0.0048389434814453125, 0.006678581237792969, 0.008518218994140625, 0.010357856750488281, 0.012197494506835938, 0.014037132263183594, 0.01587677001953125, 0.017716407775878906, 0.019556045532226562, 0.02139568328857422, 0.023235321044921875, 0.02507495880126953, 0.026914596557617188, 0.028754234313964844, 0.0305938720703125, 0.032433509826660156, 0.03427314758300781, 0.03611278533935547, 0.037952423095703125, 0.03979206085205078, 0.04163169860839844, 0.043471336364746094, 0.04531097412109375, 0.047150611877441406, 0.04899024963378906, 0.05082988739013672, 0.052669525146484375, 0.05450916290283203, 0.05634880065917969, 0.058188438415527344, 0.060028076171875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 6.0, 7.0, 14.0, 11.0, 19.0, 33.0, 31.0, 44.0, 61.0, 64.0, 86.0, 89.0, 84.0, 90.0, 82.0, 65.0, 42.0, 36.0, 35.0, 15.0, 19.0, 19.0, 12.0, 9.0, 5.0, 8.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.4020671844482422e-05, -2.3437663912773132e-05, -2.2854655981063843e-05, -2.2271648049354553e-05, -2.1688640117645264e-05, -2.1105632185935974e-05, -2.0522624254226685e-05, -1.9939616322517395e-05, -1.9356608390808105e-05, -1.8773600459098816e-05, -1.8190592527389526e-05, -1.7607584595680237e-05, -1.7024576663970947e-05, -1.6441568732261658e-05, -1.5858560800552368e-05, -1.527555286884308e-05, -1.4692544937133789e-05, -1.41095370054245e-05, -1.352652907371521e-05, -1.294352114200592e-05, -1.2360513210296631e-05, -1.1777505278587341e-05, -1.1194497346878052e-05, -1.0611489415168762e-05, -1.0028481483459473e-05, -9.445473551750183e-06, -8.862465620040894e-06, -8.279457688331604e-06, -7.696449756622314e-06, -7.113441824913025e-06, -6.530433893203735e-06, -5.947425961494446e-06, -5.364418029785156e-06, -4.781410098075867e-06, -4.198402166366577e-06, -3.6153942346572876e-06, -3.032386302947998e-06, -2.4493783712387085e-06, -1.866370439529419e-06, -1.2833625078201294e-06, -7.003545761108398e-07, -1.1734664440155029e-07, 4.6566128730773926e-07, 1.0486692190170288e-06, 1.6316771507263184e-06, 2.214685082435608e-06, 2.7976930141448975e-06, 3.380700945854187e-06, 3.9637088775634766e-06, 4.546716809272766e-06, 5.129724740982056e-06, 5.712732672691345e-06, 6.295740604400635e-06, 6.878748536109924e-06, 7.461756467819214e-06, 8.044764399528503e-06, 8.627772331237793e-06, 9.210780262947083e-06, 9.793788194656372e-06, 1.0376796126365662e-05, 1.0959804058074951e-05, 1.154281198978424e-05, 1.212581992149353e-05, 1.270882785320282e-05, 1.329183578491211e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 1.0, 3.0, 13.0, 18.0, 24.0, 30.0, 45.0, 83.0, 116.0, 202.0, 319.0, 577.0, 961.0, 2246.0, 6880.0, 27927.0, 370542.0, 593106.0, 32701.0, 7664.0, 2456.0, 1169.0, 561.0, 333.0, 191.0, 138.0, 87.0, 61.0, 37.0, 32.0, 15.0, 13.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06524658203125, -0.06333017349243164, -0.06141376495361328, -0.05949735641479492, -0.05758094787597656, -0.0556645393371582, -0.053748130798339844, -0.051831722259521484, -0.049915313720703125, -0.047998905181884766, -0.046082496643066406, -0.04416608810424805, -0.04224967956542969, -0.04033327102661133, -0.03841686248779297, -0.03650045394897461, -0.03458404541015625, -0.03266763687133789, -0.03075122833251953, -0.028834819793701172, -0.026918411254882812, -0.025002002716064453, -0.023085594177246094, -0.021169185638427734, -0.019252777099609375, -0.017336368560791016, -0.015419960021972656, -0.013503551483154297, -0.011587142944335938, -0.009670734405517578, -0.007754325866699219, -0.005837917327880859, -0.0039215087890625, -0.0020051002502441406, -8.869171142578125e-05, 0.0018277168273925781, 0.0037441253662109375, 0.005660533905029297, 0.007576942443847656, 0.009493350982666016, 0.011409759521484375, 0.013326168060302734, 0.015242576599121094, 0.017158985137939453, 0.019075393676757812, 0.020991802215576172, 0.02290821075439453, 0.02482461929321289, 0.02674102783203125, 0.02865743637084961, 0.03057384490966797, 0.03249025344848633, 0.03440666198730469, 0.03632307052612305, 0.038239479064941406, 0.040155887603759766, 0.042072296142578125, 0.043988704681396484, 0.045905113220214844, 0.0478215217590332, 0.04973793029785156, 0.05165433883666992, 0.05357074737548828, 0.05548715591430664, 0.057403564453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 5.0, 22.0, 16.0, 31.0, 92.0, 247.0, 345.0, 117.0, 43.0, 26.0, 10.0, 12.0, 8.0, 3.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0169525146484375, -0.016371488571166992, -0.015790462493896484, -0.015209436416625977, -0.014628410339355469, -0.014047384262084961, -0.013466358184814453, -0.012885332107543945, -0.012304306030273438, -0.01172327995300293, -0.011142253875732422, -0.010561227798461914, -0.009980201721191406, -0.009399175643920898, -0.00881814956665039, -0.008237123489379883, -0.007656097412109375, -0.007075071334838867, -0.006494045257568359, -0.0059130191802978516, -0.005331993103027344, -0.004750967025756836, -0.004169940948486328, -0.0035889148712158203, -0.0030078887939453125, -0.0024268627166748047, -0.0018458366394042969, -0.001264810562133789, -0.0006837844848632812, -0.00010275840759277344, 0.0004782676696777344, 0.0010592937469482422, 0.00164031982421875, 0.002221345901489258, 0.0028023719787597656, 0.0033833980560302734, 0.003964424133300781, 0.004545450210571289, 0.005126476287841797, 0.005707502365112305, 0.0062885284423828125, 0.00686955451965332, 0.007450580596923828, 0.008031606674194336, 0.008612632751464844, 0.009193658828735352, 0.00977468490600586, 0.010355710983276367, 0.010936737060546875, 0.011517763137817383, 0.01209878921508789, 0.012679815292358398, 0.013260841369628906, 0.013841867446899414, 0.014422893524169922, 0.01500391960144043, 0.015584945678710938, 0.016165971755981445, 0.016746997833251953, 0.01732802391052246, 0.01790904998779297, 0.018490076065063477, 0.019071102142333984, 0.019652128219604492, 0.020233154296875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 2.0, 6.0, 7.0, 19.0, 17.0, 24.0, 34.0, 43.0, 60.0, 99.0, 101.0, 96.0, 106.0, 102.0, 68.0, 59.0, 46.0, 33.0, 30.0, 19.0, 19.0, 10.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8477249145507812, -1.7932186126708984, -1.7387123107910156, -1.6842060089111328, -1.62969970703125, -1.5751934051513672, -1.5206869840621948, -1.466180682182312, -1.4116743803024292, -1.3571680784225464, -1.3026617765426636, -1.2481554746627808, -1.1936490535736084, -1.1391427516937256, -1.0846364498138428, -1.03013014793396, -0.9756238460540771, -0.9211175441741943, -0.8666112422943115, -0.8121048808097839, -0.7575985789299011, -0.7030922770500183, -0.6485859155654907, -0.5940796136856079, -0.5395733118057251, -0.4850670099258423, -0.4305606782436371, -0.3760543465614319, -0.3215480446815491, -0.26704174280166626, -0.21253541111946106, -0.15802907943725586, -0.1035226583480835, -0.04901634156703949, 0.005489975214004517, 0.05999629199504852, 0.11450260877609253, 0.16900891065597534, 0.22351524233818054, 0.27802157402038574, 0.33252787590026855, 0.38703417778015137, 0.44154050946235657, 0.49604684114456177, 0.5505531430244446, 0.6050594449043274, 0.659565806388855, 0.7140721082687378, 0.7685784101486206, 0.8230847120285034, 0.8775910139083862, 0.9320973753929138, 0.9866036772727966, 1.0411100387573242, 1.095616340637207, 1.1501226425170898, 1.2046289443969727, 1.2591352462768555, 1.3136415481567383, 1.368147850036621, 1.422654151916504, 1.4771604537963867, 1.531666874885559, 1.586173176765442, 1.6406794786453247]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 3.0, 2.0, 7.0, 5.0, 6.0, 12.0, 10.0, 19.0, 20.0, 27.0, 26.0, 32.0, 35.0, 36.0, 49.0, 67.0, 50.0, 66.0, 55.0, 45.0, 45.0, 49.0, 43.0, 43.0, 42.0, 45.0, 26.0, 28.0, 27.0, 23.0, 11.0, 7.0, 12.0, 5.0, 7.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0488290786743164, -1.0135501623153687, -0.9782712459564209, -0.9429923295974731, -0.9077134132385254, -0.8724344968795776, -0.8371555209159851, -0.8018766045570374, -0.7665976881980896, -0.7313187718391418, -0.6960398554801941, -0.6607609391212463, -0.6254819631576538, -0.590203046798706, -0.5549241304397583, -0.5196452140808105, -0.4843662977218628, -0.44908738136291504, -0.4138084650039673, -0.37852951884269714, -0.3432506024837494, -0.30797168612480164, -0.2726927399635315, -0.23741382360458374, -0.202134907245636, -0.16685599088668823, -0.13157705962657928, -0.09629813581705093, -0.06101921200752258, -0.02574029564857483, 0.009538635611534119, 0.044817566871643066, 0.08009636402130127, 0.11537528783082962, 0.15065421164035797, 0.18593314290046692, 0.22121205925941467, 0.2564909756183624, 0.29176992177963257, 0.3270488381385803, 0.3623277544975281, 0.39760667085647583, 0.4328855872154236, 0.4681645333766937, 0.5034434795379639, 0.5387223958969116, 0.5740013122558594, 0.6092802286148071, 0.6445591449737549, 0.6798380613327026, 0.7151169776916504, 0.7503958940505981, 0.7856748104095459, 0.8209537267684937, 0.8562327027320862, 0.8915116190910339, 0.9267905354499817, 0.9620694518089294, 0.9973483681678772, 1.0326273441314697, 1.0679062604904175, 1.1031851768493652, 1.138464093208313, 1.1737430095672607, 1.2090219259262085]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 6.0, 9.0, 15.0, 12.0, 27.0, 25.0, 39.0, 56.0, 88.0, 120.0, 170.0, 243.0, 411.0, 569.0, 873.0, 1394.0, 2344.0, 4056.0, 7595.0, 15329.0, 35175.0, 90598.0, 278615.0, 389781.0, 130692.0, 47975.0, 19991.0, 9659.0, 5059.0, 2739.0, 1730.0, 1082.0, 647.0, 470.0, 304.0, 216.0, 124.0, 84.0, 75.0, 52.0, 31.0, 18.0, 16.0, 15.0, 12.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0], "bins": [-1.14453125, -1.106597900390625, -1.06866455078125, -1.030731201171875, -0.9927978515625, -0.954864501953125, -0.91693115234375, -0.878997802734375, -0.841064453125, -0.803131103515625, -0.76519775390625, -0.727264404296875, -0.6893310546875, -0.651397705078125, -0.61346435546875, -0.575531005859375, -0.53759765625, -0.499664306640625, -0.46173095703125, -0.423797607421875, -0.3858642578125, -0.347930908203125, -0.30999755859375, -0.272064208984375, -0.234130859375, -0.196197509765625, -0.15826416015625, -0.120330810546875, -0.0823974609375, -0.044464111328125, -0.00653076171875, 0.031402587890625, 0.0693359375, 0.107269287109375, 0.14520263671875, 0.183135986328125, 0.2210693359375, 0.259002685546875, 0.29693603515625, 0.334869384765625, 0.372802734375, 0.410736083984375, 0.44866943359375, 0.486602783203125, 0.5245361328125, 0.562469482421875, 0.60040283203125, 0.638336181640625, 0.67626953125, 0.714202880859375, 0.75213623046875, 0.790069580078125, 0.8280029296875, 0.865936279296875, 0.90386962890625, 0.941802978515625, 0.979736328125, 1.017669677734375, 1.05560302734375, 1.093536376953125, 1.1314697265625, 1.169403076171875, 1.20733642578125, 1.245269775390625, 1.283203125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 9.0, 7.0, 16.0, 22.0, 27.0, 21.0, 33.0, 40.0, 42.0, 53.0, 55.0, 53.0, 69.0, 69.0, 57.0, 64.0, 40.0, 57.0, 44.0, 49.0, 29.0, 30.0, 19.0, 25.0, 17.0, 6.0, 6.0, 7.0, 6.0, 5.0, 6.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.634765625, -2.551300048828125, -2.46783447265625, -2.384368896484375, -2.3009033203125, -2.217437744140625, -2.13397216796875, -2.050506591796875, -1.967041015625, -1.883575439453125, -1.80010986328125, -1.716644287109375, -1.6331787109375, -1.549713134765625, -1.46624755859375, -1.382781982421875, -1.29931640625, -1.215850830078125, -1.13238525390625, -1.048919677734375, -0.9654541015625, -0.881988525390625, -0.79852294921875, -0.715057373046875, -0.631591796875, -0.548126220703125, -0.46466064453125, -0.381195068359375, -0.2977294921875, -0.214263916015625, -0.13079833984375, -0.047332763671875, 0.0361328125, 0.119598388671875, 0.20306396484375, 0.286529541015625, 0.3699951171875, 0.453460693359375, 0.53692626953125, 0.620391845703125, 0.703857421875, 0.787322998046875, 0.87078857421875, 0.954254150390625, 1.0377197265625, 1.121185302734375, 1.20465087890625, 1.288116455078125, 1.37158203125, 1.455047607421875, 1.53851318359375, 1.621978759765625, 1.7054443359375, 1.788909912109375, 1.87237548828125, 1.955841064453125, 2.039306640625, 2.122772216796875, 2.20623779296875, 2.289703369140625, 2.3731689453125, 2.456634521484375, 2.54010009765625, 2.623565673828125, 2.70703125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 5.0, 7.0, 9.0, 7.0, 10.0, 18.0, 20.0, 44.0, 47.0, 82.0, 126.0, 266.0, 571.0, 1476.0, 4900.0, 22498.0, 159509.0, 728295.0, 107671.0, 16809.0, 3951.0, 1192.0, 465.0, 227.0, 118.0, 66.0, 54.0, 29.0, 23.0, 20.0, 8.0, 8.0, 7.0, 4.0, 3.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.869140625, -2.79034423828125, -2.7115478515625, -2.63275146484375, -2.553955078125, -2.47515869140625, -2.3963623046875, -2.31756591796875, -2.23876953125, -2.15997314453125, -2.0811767578125, -2.00238037109375, -1.923583984375, -1.84478759765625, -1.7659912109375, -1.68719482421875, -1.6083984375, -1.52960205078125, -1.4508056640625, -1.37200927734375, -1.293212890625, -1.21441650390625, -1.1356201171875, -1.05682373046875, -0.97802734375, -0.89923095703125, -0.8204345703125, -0.74163818359375, -0.662841796875, -0.58404541015625, -0.5052490234375, -0.42645263671875, -0.34765625, -0.26885986328125, -0.1900634765625, -0.11126708984375, -0.032470703125, 0.04632568359375, 0.1251220703125, 0.20391845703125, 0.28271484375, 0.36151123046875, 0.4403076171875, 0.51910400390625, 0.597900390625, 0.67669677734375, 0.7554931640625, 0.83428955078125, 0.9130859375, 0.99188232421875, 1.0706787109375, 1.14947509765625, 1.228271484375, 1.30706787109375, 1.3858642578125, 1.46466064453125, 1.54345703125, 1.62225341796875, 1.7010498046875, 1.77984619140625, 1.858642578125, 1.93743896484375, 2.0162353515625, 2.09503173828125, 2.173828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 5.0, 6.0, 16.0, 14.0, 24.0, 16.0, 24.0, 28.0, 51.0, 41.0, 39.0, 46.0, 58.0, 64.0, 72.0, 78.0, 52.0, 56.0, 53.0, 48.0, 50.0, 33.0, 28.0, 19.0, 15.0, 12.0, 13.0, 7.0, 17.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.259765625, -3.150726318359375, -3.04168701171875, -2.932647705078125, -2.8236083984375, -2.714569091796875, -2.60552978515625, -2.496490478515625, -2.387451171875, -2.278411865234375, -2.16937255859375, -2.060333251953125, -1.9512939453125, -1.842254638671875, -1.73321533203125, -1.624176025390625, -1.51513671875, -1.406097412109375, -1.29705810546875, -1.188018798828125, -1.0789794921875, -0.969940185546875, -0.86090087890625, -0.751861572265625, -0.642822265625, -0.533782958984375, -0.42474365234375, -0.315704345703125, -0.2066650390625, -0.097625732421875, 0.01141357421875, 0.120452880859375, 0.2294921875, 0.338531494140625, 0.44757080078125, 0.556610107421875, 0.6656494140625, 0.774688720703125, 0.88372802734375, 0.992767333984375, 1.101806640625, 1.210845947265625, 1.31988525390625, 1.428924560546875, 1.5379638671875, 1.647003173828125, 1.75604248046875, 1.865081787109375, 1.97412109375, 2.083160400390625, 2.19219970703125, 2.301239013671875, 2.4102783203125, 2.519317626953125, 2.62835693359375, 2.737396240234375, 2.846435546875, 2.955474853515625, 3.06451416015625, 3.173553466796875, 3.2825927734375, 3.391632080078125, 3.50067138671875, 3.609710693359375, 3.71875]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 1.0, 1.0, 10.0, 9.0, 18.0, 18.0, 21.0, 41.0, 97.0, 184.0, 489.0, 1585.0, 6787.0, 42629.0, 360916.0, 560830.0, 62454.0, 9395.0, 1965.0, 598.0, 260.0, 110.0, 54.0, 21.0, 16.0, 11.0, 6.0, 12.0, 5.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1611328125, -1.132171630859375, -1.10321044921875, -1.074249267578125, -1.0452880859375, -1.016326904296875, -0.98736572265625, -0.958404541015625, -0.929443359375, -0.900482177734375, -0.87152099609375, -0.842559814453125, -0.8135986328125, -0.784637451171875, -0.75567626953125, -0.726715087890625, -0.69775390625, -0.668792724609375, -0.63983154296875, -0.610870361328125, -0.5819091796875, -0.552947998046875, -0.52398681640625, -0.495025634765625, -0.466064453125, -0.437103271484375, -0.40814208984375, -0.379180908203125, -0.3502197265625, -0.321258544921875, -0.29229736328125, -0.263336181640625, -0.234375, -0.205413818359375, -0.17645263671875, -0.147491455078125, -0.1185302734375, -0.089569091796875, -0.06060791015625, -0.031646728515625, -0.002685546875, 0.026275634765625, 0.05523681640625, 0.084197998046875, 0.1131591796875, 0.142120361328125, 0.17108154296875, 0.200042724609375, 0.22900390625, 0.257965087890625, 0.28692626953125, 0.315887451171875, 0.3448486328125, 0.373809814453125, 0.40277099609375, 0.431732177734375, 0.460693359375, 0.489654541015625, 0.51861572265625, 0.547576904296875, 0.5765380859375, 0.605499267578125, 0.63446044921875, 0.663421630859375, 0.6923828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 8.0, 8.0, 11.0, 22.0, 28.0, 33.0, 34.0, 45.0, 59.0, 108.0, 154.0, 125.0, 116.0, 68.0, 50.0, 34.0, 19.0, 23.0, 13.0, 9.0, 8.0, 8.0, 8.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011599063873291016, -0.00011209957301616669, -0.00010820850729942322, -0.00010431744158267975, -0.00010042637586593628, -9.653531014919281e-05, -9.264424443244934e-05, -8.875317871570587e-05, -8.48621129989624e-05, -8.097104728221893e-05, -7.707998156547546e-05, -7.3188915848732e-05, -6.929785013198853e-05, -6.540678441524506e-05, -6.151571869850159e-05, -5.762465298175812e-05, -5.373358726501465e-05, -4.984252154827118e-05, -4.595145583152771e-05, -4.206039011478424e-05, -3.816932439804077e-05, -3.42782586812973e-05, -3.0387192964553833e-05, -2.6496127247810364e-05, -2.2605061531066895e-05, -1.8713995814323425e-05, -1.4822930097579956e-05, -1.0931864380836487e-05, -7.040798664093018e-06, -3.1497329473495483e-06, 7.413327693939209e-07, 4.63239848613739e-06, 8.52346420288086e-06, 1.2414529919624329e-05, 1.6305595636367798e-05, 2.0196661353111267e-05, 2.4087727069854736e-05, 2.7978792786598206e-05, 3.1869858503341675e-05, 3.5760924220085144e-05, 3.965198993682861e-05, 4.354305565357208e-05, 4.743412137031555e-05, 5.132518708705902e-05, 5.521625280380249e-05, 5.910731852054596e-05, 6.299838423728943e-05, 6.68894499540329e-05, 7.078051567077637e-05, 7.467158138751984e-05, 7.85626471042633e-05, 8.245371282100677e-05, 8.634477853775024e-05, 9.023584425449371e-05, 9.412690997123718e-05, 9.801797568798065e-05, 0.00010190904140472412, 0.00010580010712146759, 0.00010969117283821106, 0.00011358223855495453, 0.000117473304271698, 0.00012136436998844147, 0.00012525543570518494, 0.0001291465014219284, 0.00013303756713867188]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 4.0, 14.0, 10.0, 19.0, 46.0, 85.0, 168.0, 369.0, 955.0, 2934.0, 10664.0, 48856.0, 259021.0, 576210.0, 117735.0, 23039.0, 5545.0, 1770.0, 606.0, 239.0, 129.0, 61.0, 22.0, 11.0, 11.0, 12.0, 6.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57666015625, -0.5518722534179688, -0.5270843505859375, -0.5022964477539062, -0.477508544921875, -0.45272064208984375, -0.4279327392578125, -0.40314483642578125, -0.37835693359375, -0.35356903076171875, -0.3287811279296875, -0.30399322509765625, -0.279205322265625, -0.25441741943359375, -0.2296295166015625, -0.20484161376953125, -0.1800537109375, -0.15526580810546875, -0.1304779052734375, -0.10569000244140625, -0.080902099609375, -0.05611419677734375, -0.0313262939453125, -0.00653839111328125, 0.01824951171875, 0.04303741455078125, 0.0678253173828125, 0.09261322021484375, 0.117401123046875, 0.14218902587890625, 0.1669769287109375, 0.19176483154296875, 0.216552734375, 0.24134063720703125, 0.2661285400390625, 0.29091644287109375, 0.315704345703125, 0.34049224853515625, 0.3652801513671875, 0.39006805419921875, 0.41485595703125, 0.43964385986328125, 0.4644317626953125, 0.48921966552734375, 0.514007568359375, 0.5387954711914062, 0.5635833740234375, 0.5883712768554688, 0.6131591796875, 0.6379470825195312, 0.6627349853515625, 0.6875228881835938, 0.712310791015625, 0.7370986938476562, 0.7618865966796875, 0.7866744995117188, 0.81146240234375, 0.8362503051757812, 0.8610382080078125, 0.8858261108398438, 0.910614013671875, 0.9354019165039062, 0.9601898193359375, 0.9849777221679688, 1.009765625]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 5.0, 10.0, 20.0, 19.0, 22.0, 30.0, 46.0, 48.0, 76.0, 97.0, 115.0, 119.0, 94.0, 75.0, 49.0, 34.0, 25.0, 29.0, 19.0, 16.0, 14.0, 6.0, 7.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.47802734375, -0.46613311767578125, -0.4542388916015625, -0.44234466552734375, -0.430450439453125, -0.41855621337890625, -0.4066619873046875, -0.39476776123046875, -0.38287353515625, -0.37097930908203125, -0.3590850830078125, -0.34719085693359375, -0.335296630859375, -0.32340240478515625, -0.3115081787109375, -0.29961395263671875, -0.2877197265625, -0.27582550048828125, -0.2639312744140625, -0.25203704833984375, -0.240142822265625, -0.22824859619140625, -0.2163543701171875, -0.20446014404296875, -0.19256591796875, -0.18067169189453125, -0.1687774658203125, -0.15688323974609375, -0.144989013671875, -0.13309478759765625, -0.1212005615234375, -0.10930633544921875, -0.097412109375, -0.08551788330078125, -0.0736236572265625, -0.06172943115234375, -0.049835205078125, -0.03794097900390625, -0.0260467529296875, -0.01415252685546875, -0.00225830078125, 0.00963592529296875, 0.0215301513671875, 0.03342437744140625, 0.045318603515625, 0.05721282958984375, 0.0691070556640625, 0.08100128173828125, 0.0928955078125, 0.10478973388671875, 0.1166839599609375, 0.12857818603515625, 0.140472412109375, 0.15236663818359375, 0.1642608642578125, 0.17615509033203125, 0.18804931640625, 0.19994354248046875, 0.2118377685546875, 0.22373199462890625, 0.235626220703125, 0.24752044677734375, 0.2594146728515625, 0.27130889892578125, 0.283203125]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 20.0, 27.0, 70.0, 91.0, 159.0, 185.0, 172.0, 124.0, 75.0, 32.0, 20.0, 15.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-10.549402236938477, -10.336786270141602, -10.124170303344727, -9.911555290222168, -9.698939323425293, -9.486323356628418, -9.27370834350586, -9.061092376708984, -8.84847640991211, -8.635860443115234, -8.42324447631836, -8.2106294631958, -7.998013496398926, -7.785397529602051, -7.572782039642334, -7.360166549682617, -7.147550582885742, -6.934934616088867, -6.72231912612915, -6.509703636169434, -6.297087669372559, -6.084471702575684, -5.871856212615967, -5.65924072265625, -5.446624755859375, -5.2340087890625, -5.021393299102783, -4.808777809143066, -4.596161842346191, -4.383545875549316, -4.1709303855896, -3.9583146572113037, -3.745698928833008, -3.533083200454712, -3.320467472076416, -3.10785174369812, -2.895236015319824, -2.6826202869415283, -2.4700045585632324, -2.2573888301849365, -2.0447731018066406, -1.8321573734283447, -1.6195416450500488, -1.406925916671753, -1.194310188293457, -0.9816944599151611, -0.7690787315368652, -0.5564630031585693, -0.34384727478027344, -0.13123154640197754, 0.08138418197631836, 0.29399991035461426, 0.5066156387329102, 0.719231367111206, 0.931847095489502, 1.1444628238677979, 1.3570785522460938, 1.5696942806243896, 1.7823100090026855, 1.9949257373809814, 2.2075414657592773, 2.4201571941375732, 2.632772922515869, 2.845388650894165, 3.058004379272461]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 2.0, 7.0, 9.0, 10.0, 6.0, 10.0, 7.0, 12.0, 16.0, 18.0, 27.0, 24.0, 34.0, 35.0, 41.0, 41.0, 31.0, 47.0, 34.0, 47.0, 55.0, 57.0, 46.0, 38.0, 37.0, 38.0, 40.0, 48.0, 27.0, 19.0, 22.0, 23.0, 12.0, 16.0, 15.0, 12.0, 14.0, 6.0, 7.0, 7.0, 2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.779695510864258, -4.633615970611572, -4.4875359535217285, -4.341456413269043, -4.195376873016357, -4.049297332763672, -3.903217315673828, -3.7571377754211426, -3.611057996749878, -3.4649782180786133, -3.3188986778259277, -3.172818899154663, -3.0267391204833984, -2.880659580230713, -2.7345798015594482, -2.5885000228881836, -2.442420482635498, -2.2963407039642334, -2.150261163711548, -2.004181385040283, -1.858101725578308, -1.712022066116333, -1.5659422874450684, -1.4198626279830933, -1.2737829685211182, -1.127703309059143, -0.9816235899925232, -0.8355438709259033, -0.6894642114639282, -0.5433845520019531, -0.39730483293533325, -0.2512251138687134, -0.10514593124389648, 0.040933758020401, 0.1870134472846985, 0.33309313654899597, 0.47917282581329346, 0.6252524852752686, 0.7713322043418884, 0.9174119234085083, 1.0634915828704834, 1.2095712423324585, 1.3556509017944336, 1.5017306804656982, 1.6478103399276733, 1.7938899993896484, 1.939969778060913, 2.0860495567321777, 2.2321290969848633, 2.378208875656128, 2.5242884159088135, 2.670368194580078, 2.8164477348327637, 2.9625275135040283, 3.108607292175293, 3.2546868324279785, 3.400766611099243, 3.546846389770508, 3.6929259300231934, 3.839005708694458, 3.9850854873657227, 4.131165027618408, 4.277244567871094, 4.4233245849609375, 4.569404125213623]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 5.0, 7.0, 7.0, 10.0, 10.0, 18.0, 19.0, 18.0, 33.0, 47.0, 50.0, 95.0, 154.0, 307.0, 741.0, 2495.0, 12315.0, 109973.0, 3092476.0, 921751.0, 44405.0, 6656.0, 1561.0, 521.0, 218.0, 116.0, 79.0, 48.0, 26.0, 22.0, 27.0, 22.0, 10.0, 10.0, 9.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.85546875, -3.744720458984375, -3.63397216796875, -3.523223876953125, -3.4124755859375, -3.301727294921875, -3.19097900390625, -3.080230712890625, -2.969482421875, -2.858734130859375, -2.74798583984375, -2.637237548828125, -2.5264892578125, -2.415740966796875, -2.30499267578125, -2.194244384765625, -2.08349609375, -1.972747802734375, -1.86199951171875, -1.751251220703125, -1.6405029296875, -1.529754638671875, -1.41900634765625, -1.308258056640625, -1.197509765625, -1.086761474609375, -0.97601318359375, -0.865264892578125, -0.7545166015625, -0.643768310546875, -0.53302001953125, -0.422271728515625, -0.3115234375, -0.200775146484375, -0.09002685546875, 0.020721435546875, 0.1314697265625, 0.242218017578125, 0.35296630859375, 0.463714599609375, 0.574462890625, 0.685211181640625, 0.79595947265625, 0.906707763671875, 1.0174560546875, 1.128204345703125, 1.23895263671875, 1.349700927734375, 1.46044921875, 1.571197509765625, 1.68194580078125, 1.792694091796875, 1.9034423828125, 2.014190673828125, 2.12493896484375, 2.235687255859375, 2.346435546875, 2.457183837890625, 2.56793212890625, 2.678680419921875, 2.7894287109375, 2.900177001953125, 3.01092529296875, 3.121673583984375, 3.232421875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 9.0, 9.0, 22.0, 21.0, 35.0, 39.0, 68.0, 77.0, 69.0, 80.0, 105.0, 81.0, 85.0, 72.0, 74.0, 53.0, 38.0, 19.0, 12.0, 17.0, 5.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.009765625, -1.9576873779296875, -1.905609130859375, -1.8535308837890625, -1.80145263671875, -1.7493743896484375, -1.697296142578125, -1.6452178955078125, -1.5931396484375, -1.5410614013671875, -1.488983154296875, -1.4369049072265625, -1.38482666015625, -1.3327484130859375, -1.280670166015625, -1.2285919189453125, -1.176513671875, -1.1244354248046875, -1.072357177734375, -1.0202789306640625, -0.96820068359375, -0.9161224365234375, -0.864044189453125, -0.8119659423828125, -0.7598876953125, -0.7078094482421875, -0.655731201171875, -0.6036529541015625, -0.55157470703125, -0.4994964599609375, -0.447418212890625, -0.3953399658203125, -0.34326171875, -0.2911834716796875, -0.239105224609375, -0.1870269775390625, -0.13494873046875, -0.0828704833984375, -0.030792236328125, 0.0212860107421875, 0.0733642578125, 0.1254425048828125, 0.177520751953125, 0.2295989990234375, 0.28167724609375, 0.3337554931640625, 0.385833740234375, 0.4379119873046875, 0.489990234375, 0.5420684814453125, 0.594146728515625, 0.6462249755859375, 0.69830322265625, 0.7503814697265625, 0.802459716796875, 0.8545379638671875, 0.9066162109375, 0.9586944580078125, 1.010772705078125, 1.0628509521484375, 1.11492919921875, 1.1670074462890625, 1.219085693359375, 1.2711639404296875, 1.3232421875]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 10.0, 13.0, 20.0, 26.0, 28.0, 58.0, 99.0, 129.0, 234.0, 560.0, 1399.0, 6674.0, 59527.0, 1340362.0, 2663804.0, 107742.0, 10292.0, 1918.0, 641.0, 299.0, 168.0, 100.0, 56.0, 36.0, 24.0, 13.0, 19.0, 11.0, 5.0, 7.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1171875, -4.003173828125, -3.88916015625, -3.775146484375, -3.6611328125, -3.547119140625, -3.43310546875, -3.319091796875, -3.205078125, -3.091064453125, -2.97705078125, -2.863037109375, -2.7490234375, -2.635009765625, -2.52099609375, -2.406982421875, -2.29296875, -2.178955078125, -2.06494140625, -1.950927734375, -1.8369140625, -1.722900390625, -1.60888671875, -1.494873046875, -1.380859375, -1.266845703125, -1.15283203125, -1.038818359375, -0.9248046875, -0.810791015625, -0.69677734375, -0.582763671875, -0.46875, -0.354736328125, -0.24072265625, -0.126708984375, -0.0126953125, 0.101318359375, 0.21533203125, 0.329345703125, 0.443359375, 0.557373046875, 0.67138671875, 0.785400390625, 0.8994140625, 1.013427734375, 1.12744140625, 1.241455078125, 1.35546875, 1.469482421875, 1.58349609375, 1.697509765625, 1.8115234375, 1.925537109375, 2.03955078125, 2.153564453125, 2.267578125, 2.381591796875, 2.49560546875, 2.609619140625, 2.7236328125, 2.837646484375, 2.95166015625, 3.065673828125, 3.1796875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 6.0, 8.0, 4.0, 8.0, 12.0, 9.0, 13.0, 29.0, 42.0, 64.0, 71.0, 86.0, 154.0, 175.0, 229.0, 308.0, 427.0, 523.0, 476.0, 363.0, 309.0, 185.0, 164.0, 115.0, 78.0, 66.0, 51.0, 26.0, 14.0, 18.0, 20.0, 9.0, 5.0, 7.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.58642578125, -0.5652542114257812, -0.5440826416015625, -0.5229110717773438, -0.501739501953125, -0.48056793212890625, -0.4593963623046875, -0.43822479248046875, -0.41705322265625, -0.39588165283203125, -0.3747100830078125, -0.35353851318359375, -0.332366943359375, -0.31119537353515625, -0.2900238037109375, -0.26885223388671875, -0.2476806640625, -0.22650909423828125, -0.2053375244140625, -0.18416595458984375, -0.162994384765625, -0.14182281494140625, -0.1206512451171875, -0.09947967529296875, -0.07830810546875, -0.05713653564453125, -0.0359649658203125, -0.01479339599609375, 0.006378173828125, 0.02754974365234375, 0.0487213134765625, 0.06989288330078125, 0.091064453125, 0.11223602294921875, 0.1334075927734375, 0.15457916259765625, 0.175750732421875, 0.19692230224609375, 0.2180938720703125, 0.23926544189453125, 0.26043701171875, 0.28160858154296875, 0.3027801513671875, 0.32395172119140625, 0.345123291015625, 0.36629486083984375, 0.3874664306640625, 0.40863800048828125, 0.4298095703125, 0.45098114013671875, 0.4721527099609375, 0.49332427978515625, 0.514495849609375, 0.5356674194335938, 0.5568389892578125, 0.5780105590820312, 0.59918212890625, 0.6203536987304688, 0.6415252685546875, 0.6626968383789062, 0.683868408203125, 0.7050399780273438, 0.7262115478515625, 0.7473831176757812, 0.7685546875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 3.0, 7.0, 4.0, 11.0, 10.0, 22.0, 14.0, 18.0, 24.0, 31.0, 26.0, 45.0, 41.0, 52.0, 48.0, 60.0, 41.0, 33.0, 64.0, 48.0, 42.0, 36.0, 43.0, 37.0, 37.0, 33.0, 26.0, 32.0, 20.0, 20.0, 11.0, 16.0, 9.0, 9.0, 7.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7298526763916016, -1.6803669929504395, -1.630881428718567, -1.5813957452774048, -1.5319101810455322, -1.4824244976043701, -1.432938814163208, -1.383453130722046, -1.3339675664901733, -1.2844818830490112, -1.2349963188171387, -1.1855106353759766, -1.1360249519348145, -1.086539387702942, -1.0370537042617798, -0.9875680804252625, -0.9380824565887451, -0.8885968327522278, -0.8391112089157104, -0.7896255254745483, -0.740139901638031, -0.6906542778015137, -0.6411685943603516, -0.5916829705238342, -0.5421973466873169, -0.49271172285079956, -0.44322606921195984, -0.3937404155731201, -0.3442547917366028, -0.29476916790008545, -0.24528351426124573, -0.195797860622406, -0.14631211757659912, -0.0968264788389206, -0.047340840101242065, 0.0021447986364364624, 0.05163043737411499, 0.10111607611179352, 0.15060171484947205, 0.20008736848831177, 0.2495729923248291, 0.29905861616134644, 0.34854426980018616, 0.3980299234390259, 0.4475155472755432, 0.49700117111206055, 0.5464868545532227, 0.59597247838974, 0.6454581022262573, 0.6949437260627747, 0.744429349899292, 0.7939150333404541, 0.8434006571769714, 0.8928862810134888, 0.9423719644546509, 0.9918575882911682, 1.0413432121276855, 1.0908288955688477, 1.1403144598007202, 1.1898001432418823, 1.2392857074737549, 1.288771390914917, 1.338257074356079, 1.3877427577972412, 1.4372283220291138]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 2.0, 6.0, 6.0, 7.0, 12.0, 14.0, 16.0, 18.0, 17.0, 23.0, 26.0, 26.0, 27.0, 40.0, 19.0, 41.0, 40.0, 32.0, 43.0, 45.0, 41.0, 34.0, 32.0, 32.0, 48.0, 31.0, 37.0, 22.0, 43.0, 30.0, 34.0, 22.0, 17.0, 20.0, 21.0, 11.0, 12.0, 9.0, 6.0, 11.0, 4.0, 5.0, 8.0, 2.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.4794626235961914, -1.4339599609375, -1.3884572982788086, -1.3429546356201172, -1.2974519729614258, -1.2519493103027344, -1.206446647644043, -1.1609439849853516, -1.1154413223266602, -1.0699386596679688, -1.0244359970092773, -0.9789333343505859, -0.9334306716918945, -0.8879280090332031, -0.8424252867698669, -0.7969226241111755, -0.7514199018478394, -0.705917239189148, -0.6604145765304565, -0.6149119138717651, -0.5694092512130737, -0.5239065885543823, -0.47840386629104614, -0.43290120363235474, -0.38739854097366333, -0.3418958783149719, -0.2963932156562805, -0.2508905231952667, -0.20538786053657532, -0.1598851978778839, -0.11438250541687012, -0.06887984275817871, -0.023377299308776855, 0.022125370800495148, 0.06762804090976715, 0.11313071846961975, 0.15863338112831116, 0.20413604378700256, 0.24963873624801636, 0.29514139890670776, 0.34064406156539917, 0.3861467242240906, 0.431649386882782, 0.4771520793437958, 0.5226547718048096, 0.568157434463501, 0.6136600971221924, 0.6591627597808838, 0.7046654224395752, 0.7501680850982666, 0.795670747756958, 0.8411734104156494, 0.8866760730743408, 0.9321787357330322, 0.9776814579963684, 1.023184061050415, 1.0686867237091064, 1.1141893863677979, 1.1596920490264893, 1.2051947116851807, 1.250697374343872, 1.2962000370025635, 1.3417026996612549, 1.3872053623199463, 1.4327081441879272]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 6.0, 11.0, 9.0, 15.0, 22.0, 21.0, 26.0, 32.0, 58.0, 65.0, 84.0, 139.0, 191.0, 264.0, 412.0, 652.0, 1598.0, 13286.0, 660340.0, 359684.0, 8409.0, 1331.0, 636.0, 353.0, 262.0, 190.0, 119.0, 85.0, 65.0, 47.0, 34.0, 22.0, 19.0, 19.0, 18.0, 4.0, 8.0, 4.0, 3.0, 1.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56298828125, -0.5441741943359375, -0.525360107421875, -0.5065460205078125, -0.48773193359375, -0.4689178466796875, -0.450103759765625, -0.4312896728515625, -0.4124755859375, -0.3936614990234375, -0.374847412109375, -0.3560333251953125, -0.33721923828125, -0.3184051513671875, -0.299591064453125, -0.2807769775390625, -0.261962890625, -0.2431488037109375, -0.224334716796875, -0.2055206298828125, -0.18670654296875, -0.1678924560546875, -0.149078369140625, -0.1302642822265625, -0.1114501953125, -0.0926361083984375, -0.073822021484375, -0.0550079345703125, -0.03619384765625, -0.0173797607421875, 0.001434326171875, 0.0202484130859375, 0.0390625, 0.0578765869140625, 0.076690673828125, 0.0955047607421875, 0.11431884765625, 0.1331329345703125, 0.151947021484375, 0.1707611083984375, 0.1895751953125, 0.2083892822265625, 0.227203369140625, 0.2460174560546875, 0.26483154296875, 0.2836456298828125, 0.302459716796875, 0.3212738037109375, 0.340087890625, 0.3589019775390625, 0.377716064453125, 0.3965301513671875, 0.41534423828125, 0.4341583251953125, 0.452972412109375, 0.4717864990234375, 0.4906005859375, 0.5094146728515625, 0.528228759765625, 0.5470428466796875, 0.56585693359375, 0.5846710205078125, 0.603485107421875, 0.6222991943359375, 0.64111328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 2.0, 5.0, 10.0, 10.0, 12.0, 18.0, 14.0, 11.0, 28.0, 25.0, 25.0, 38.0, 34.0, 39.0, 36.0, 49.0, 30.0, 46.0, 50.0, 47.0, 47.0, 48.0, 38.0, 32.0, 34.0, 33.0, 41.0, 35.0, 20.0, 28.0, 20.0, 18.0, 13.0, 13.0, 13.0, 12.0, 8.0, 9.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.234375, -1.198455810546875, -1.16253662109375, -1.126617431640625, -1.0906982421875, -1.054779052734375, -1.01885986328125, -0.982940673828125, -0.947021484375, -0.911102294921875, -0.87518310546875, -0.839263916015625, -0.8033447265625, -0.767425537109375, -0.73150634765625, -0.695587158203125, -0.65966796875, -0.623748779296875, -0.58782958984375, -0.551910400390625, -0.5159912109375, -0.480072021484375, -0.44415283203125, -0.408233642578125, -0.372314453125, -0.336395263671875, -0.30047607421875, -0.264556884765625, -0.2286376953125, -0.192718505859375, -0.15679931640625, -0.120880126953125, -0.0849609375, -0.049041748046875, -0.01312255859375, 0.022796630859375, 0.0587158203125, 0.094635009765625, 0.13055419921875, 0.166473388671875, 0.202392578125, 0.238311767578125, 0.27423095703125, 0.310150146484375, 0.3460693359375, 0.381988525390625, 0.41790771484375, 0.453826904296875, 0.48974609375, 0.525665283203125, 0.56158447265625, 0.597503662109375, 0.6334228515625, 0.669342041015625, 0.70526123046875, 0.741180419921875, 0.777099609375, 0.813018798828125, 0.84893798828125, 0.884857177734375, 0.9207763671875, 0.956695556640625, 0.99261474609375, 1.028533935546875, 1.064453125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 7.0, 3.0, 5.0, 8.0, 12.0, 14.0, 14.0, 32.0, 33.0, 44.0, 39.0, 57.0, 83.0, 120.0, 145.0, 174.0, 283.0, 488.0, 1328.0, 6667.0, 55265.0, 654334.0, 297020.0, 26100.0, 3972.0, 919.0, 391.0, 246.0, 178.0, 139.0, 101.0, 78.0, 44.0, 48.0, 22.0, 26.0, 28.0, 17.0, 23.0, 10.0, 13.0, 4.0, 8.0, 6.0, 1.0, 2.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.31005859375, -0.3008918762207031, -0.29172515869140625, -0.2825584411621094, -0.2733917236328125, -0.2642250061035156, -0.25505828857421875, -0.24589157104492188, -0.236724853515625, -0.22755813598632812, -0.21839141845703125, -0.20922470092773438, -0.2000579833984375, -0.19089126586914062, -0.18172454833984375, -0.17255783081054688, -0.16339111328125, -0.15422439575195312, -0.14505767822265625, -0.13589096069335938, -0.1267242431640625, -0.11755752563476562, -0.10839080810546875, -0.09922409057617188, -0.090057373046875, -0.08089065551757812, -0.07172393798828125, -0.06255722045898438, -0.0533905029296875, -0.044223785400390625, -0.03505706787109375, -0.025890350341796875, -0.0167236328125, -0.007556915283203125, 0.00160980224609375, 0.010776519775390625, 0.0199432373046875, 0.029109954833984375, 0.03827667236328125, 0.047443389892578125, 0.056610107421875, 0.06577682495117188, 0.07494354248046875, 0.08411026000976562, 0.0932769775390625, 0.10244369506835938, 0.11161041259765625, 0.12077713012695312, 0.12994384765625, 0.13911056518554688, 0.14827728271484375, 0.15744400024414062, 0.1666107177734375, 0.17577743530273438, 0.18494415283203125, 0.19411087036132812, 0.203277587890625, 0.21244430541992188, 0.22161102294921875, 0.23077774047851562, 0.2399444580078125, 0.24911117553710938, 0.25827789306640625, 0.2674446105957031, 0.276611328125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 4.0, 5.0, 6.0, 10.0, 13.0, 9.0, 11.0, 22.0, 21.0, 37.0, 26.0, 31.0, 38.0, 29.0, 36.0, 43.0, 43.0, 42.0, 50.0, 43.0, 40.0, 57.0, 46.0, 36.0, 35.0, 38.0, 34.0, 30.0, 24.0, 20.0, 16.0, 13.0, 14.0, 16.0, 14.0, 12.0, 14.0, 8.0, 9.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.947265625, -2.856170654296875, -2.76507568359375, -2.673980712890625, -2.5828857421875, -2.491790771484375, -2.40069580078125, -2.309600830078125, -2.218505859375, -2.127410888671875, -2.03631591796875, -1.945220947265625, -1.8541259765625, -1.763031005859375, -1.67193603515625, -1.580841064453125, -1.48974609375, -1.398651123046875, -1.30755615234375, -1.216461181640625, -1.1253662109375, -1.034271240234375, -0.94317626953125, -0.852081298828125, -0.760986328125, -0.669891357421875, -0.57879638671875, -0.487701416015625, -0.3966064453125, -0.305511474609375, -0.21441650390625, -0.123321533203125, -0.0322265625, 0.058868408203125, 0.14996337890625, 0.241058349609375, 0.3321533203125, 0.423248291015625, 0.51434326171875, 0.605438232421875, 0.696533203125, 0.787628173828125, 0.87872314453125, 0.969818115234375, 1.0609130859375, 1.152008056640625, 1.24310302734375, 1.334197998046875, 1.42529296875, 1.516387939453125, 1.60748291015625, 1.698577880859375, 1.7896728515625, 1.880767822265625, 1.97186279296875, 2.062957763671875, 2.154052734375, 2.245147705078125, 2.33624267578125, 2.427337646484375, 2.5184326171875, 2.609527587890625, 2.70062255859375, 2.791717529296875, 2.8828125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 10.0, 7.0, 15.0, 13.0, 23.0, 25.0, 40.0, 52.0, 75.0, 105.0, 181.0, 344.0, 604.0, 1586.0, 15581.0, 965516.0, 59876.0, 2709.0, 787.0, 376.0, 202.0, 127.0, 99.0, 49.0, 36.0, 25.0, 26.0, 13.0, 10.0, 10.0, 9.0, 6.0, 7.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 4.0, 1.0], "bins": [-0.0830078125, -0.08086061477661133, -0.07871341705322266, -0.07656621932983398, -0.07441902160644531, -0.07227182388305664, -0.07012462615966797, -0.0679774284362793, -0.06583023071289062, -0.06368303298950195, -0.06153583526611328, -0.05938863754272461, -0.05724143981933594, -0.055094242095947266, -0.052947044372558594, -0.05079984664916992, -0.04865264892578125, -0.04650545120239258, -0.044358253479003906, -0.042211055755615234, -0.04006385803222656, -0.03791666030883789, -0.03576946258544922, -0.03362226486206055, -0.031475067138671875, -0.029327869415283203, -0.02718067169189453, -0.02503347396850586, -0.022886276245117188, -0.020739078521728516, -0.018591880798339844, -0.016444683074951172, -0.0142974853515625, -0.012150287628173828, -0.010003089904785156, -0.007855892181396484, -0.0057086944580078125, -0.0035614967346191406, -0.0014142990112304688, 0.0007328987121582031, 0.002880096435546875, 0.005027294158935547, 0.007174491882324219, 0.00932168960571289, 0.011468887329101562, 0.013616085052490234, 0.015763282775878906, 0.017910480499267578, 0.02005767822265625, 0.022204875946044922, 0.024352073669433594, 0.026499271392822266, 0.028646469116210938, 0.03079366683959961, 0.03294086456298828, 0.03508806228637695, 0.037235260009765625, 0.0393824577331543, 0.04152965545654297, 0.04367685317993164, 0.04582405090332031, 0.047971248626708984, 0.050118446350097656, 0.05226564407348633, 0.054412841796875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 5.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 7.0, 3.0, 15.0, 8.0, 17.0, 15.0, 33.0, 52.0, 48.0, 59.0, 85.0, 84.0, 91.0, 94.0, 87.0, 70.0, 65.0, 38.0, 34.0, 23.0, 15.0, 10.0, 9.0, 8.0, 5.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.7239322662353516e-05, -2.649892121553421e-05, -2.5758519768714905e-05, -2.50181183218956e-05, -2.4277716875076294e-05, -2.353731542825699e-05, -2.2796913981437683e-05, -2.2056512534618378e-05, -2.1316111087799072e-05, -2.0575709640979767e-05, -1.983530819416046e-05, -1.9094906747341156e-05, -1.835450530052185e-05, -1.7614103853702545e-05, -1.687370240688324e-05, -1.6133300960063934e-05, -1.539289951324463e-05, -1.4652498066425323e-05, -1.3912096619606018e-05, -1.3171695172786713e-05, -1.2431293725967407e-05, -1.1690892279148102e-05, -1.0950490832328796e-05, -1.0210089385509491e-05, -9.469687938690186e-06, -8.72928649187088e-06, -7.988885045051575e-06, -7.248483598232269e-06, -6.508082151412964e-06, -5.7676807045936584e-06, -5.027279257774353e-06, -4.286877810955048e-06, -3.546476364135742e-06, -2.8060749173164368e-06, -2.0656734704971313e-06, -1.325272023677826e-06, -5.848705768585205e-07, 1.555308699607849e-07, 8.959323167800903e-07, 1.6363337635993958e-06, 2.376735210418701e-06, 3.1171366572380066e-06, 3.857538104057312e-06, 4.5979395508766174e-06, 5.338340997695923e-06, 6.078742444515228e-06, 6.819143891334534e-06, 7.559545338153839e-06, 8.299946784973145e-06, 9.04034823179245e-06, 9.780749678611755e-06, 1.052115112543106e-05, 1.1261552572250366e-05, 1.2001954019069672e-05, 1.2742355465888977e-05, 1.3482756912708282e-05, 1.4223158359527588e-05, 1.4963559806346893e-05, 1.57039612531662e-05, 1.6444362699985504e-05, 1.718476414680481e-05, 1.7925165593624115e-05, 1.866556704044342e-05, 1.9405968487262726e-05, 2.014636993408203e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 2.0, 6.0, 4.0, 17.0, 18.0, 21.0, 44.0, 50.0, 71.0, 94.0, 128.0, 189.0, 300.0, 499.0, 800.0, 1282.0, 2346.0, 4558.0, 9480.0, 24950.0, 102099.0, 645513.0, 192730.0, 38091.0, 12890.0, 5671.0, 2812.0, 1488.0, 852.0, 500.0, 328.0, 214.0, 142.0, 115.0, 77.0, 40.0, 34.0, 36.0, 16.0, 11.0, 9.0, 13.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036041259765625, -0.03482627868652344, -0.033611297607421875, -0.03239631652832031, -0.03118133544921875, -0.029966354370117188, -0.028751373291015625, -0.027536392211914062, -0.0263214111328125, -0.025106430053710938, -0.023891448974609375, -0.022676467895507812, -0.02146148681640625, -0.020246505737304688, -0.019031524658203125, -0.017816543579101562, -0.0166015625, -0.015386581420898438, -0.014171600341796875, -0.012956619262695312, -0.01174163818359375, -0.010526657104492188, -0.009311676025390625, -0.008096694946289062, -0.0068817138671875, -0.0056667327880859375, -0.004451751708984375, -0.0032367706298828125, -0.00202178955078125, -0.0008068084716796875, 0.000408172607421875, 0.0016231536865234375, 0.002838134765625, 0.0040531158447265625, 0.005268096923828125, 0.0064830780029296875, 0.00769805908203125, 0.008913040161132812, 0.010128021240234375, 0.011343002319335938, 0.0125579833984375, 0.013772964477539062, 0.014987945556640625, 0.016202926635742188, 0.01741790771484375, 0.018632888793945312, 0.019847869873046875, 0.021062850952148438, 0.02227783203125, 0.023492813110351562, 0.024707794189453125, 0.025922775268554688, 0.02713775634765625, 0.028352737426757812, 0.029567718505859375, 0.030782699584960938, 0.0319976806640625, 0.03321266174316406, 0.034427642822265625, 0.03564262390136719, 0.03685760498046875, 0.03807258605957031, 0.039287567138671875, 0.04050254821777344, 0.041717529296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 7.0, 9.0, 7.0, 14.0, 12.0, 30.0, 54.0, 71.0, 91.0, 225.0, 160.0, 89.0, 65.0, 49.0, 23.0, 23.0, 22.0, 4.0, 5.0, 8.0, 2.0, 4.0, 3.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0107879638671875, -0.010386109352111816, -0.009984254837036133, -0.00958240032196045, -0.009180545806884766, -0.008778691291809082, -0.008376836776733398, -0.007974982261657715, -0.007573127746582031, -0.007171273231506348, -0.006769418716430664, -0.0063675642013549805, -0.005965709686279297, -0.005563855171203613, -0.00516200065612793, -0.004760146141052246, -0.0043582916259765625, -0.003956437110900879, -0.0035545825958251953, -0.0031527280807495117, -0.002750873565673828, -0.0023490190505981445, -0.001947164535522461, -0.0015453100204467773, -0.0011434555053710938, -0.0007416009902954102, -0.00033974647521972656, 6.210803985595703e-05, 0.0004639625549316406, 0.0008658170700073242, 0.0012676715850830078, 0.0016695261001586914, 0.002071380615234375, 0.0024732351303100586, 0.002875089645385742, 0.0032769441604614258, 0.0036787986755371094, 0.004080653190612793, 0.0044825077056884766, 0.00488436222076416, 0.005286216735839844, 0.005688071250915527, 0.006089925765991211, 0.0064917802810668945, 0.006893634796142578, 0.007295489311218262, 0.007697343826293945, 0.008099198341369629, 0.008501052856445312, 0.008902907371520996, 0.00930476188659668, 0.009706616401672363, 0.010108470916748047, 0.01051032543182373, 0.010912179946899414, 0.011314034461975098, 0.011715888977050781, 0.012117743492126465, 0.012519598007202148, 0.012921452522277832, 0.013323307037353516, 0.0137251615524292, 0.014127016067504883, 0.014528870582580566, 0.01493072509765625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 7.0, 5.0, 4.0, 6.0, 10.0, 15.0, 14.0, 21.0, 27.0, 23.0, 21.0, 39.0, 49.0, 50.0, 53.0, 54.0, 54.0, 55.0, 56.0, 53.0, 41.0, 50.0, 36.0, 35.0, 38.0, 37.0, 33.0, 30.0, 20.0, 13.0, 10.0, 15.0, 8.0, 8.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.136176586151123, -1.100453495979309, -1.0647305250167847, -1.0290074348449707, -0.9932844042778015, -0.9575613737106323, -0.9218382835388184, -0.8861152529716492, -0.85039222240448, -0.8146691918373108, -0.7789461612701416, -0.7432230710983276, -0.7075000405311584, -0.6717770099639893, -0.6360539197921753, -0.6003308892250061, -0.5646078586578369, -0.5288848280906677, -0.49316176772117615, -0.45743870735168457, -0.4217156767845154, -0.3859926462173462, -0.3502695858478546, -0.31454652547836304, -0.27882349491119385, -0.24310044944286346, -0.20737740397453308, -0.1716543585062027, -0.13593131303787231, -0.10020826756954193, -0.06448522210121155, -0.02876216173171997, 0.006960868835449219, 0.0426839143037796, 0.07840695977210999, 0.11413000524044037, 0.14985305070877075, 0.18557609617710114, 0.22129914164543152, 0.2570222020149231, 0.2927452325820923, 0.3284682631492615, 0.36419132351875305, 0.39991438388824463, 0.4356374144554138, 0.471360445022583, 0.507083535194397, 0.5428065657615662, 0.5785295963287354, 0.6142526268959045, 0.6499756574630737, 0.6856987476348877, 0.7214217782020569, 0.7571448087692261, 0.79286789894104, 0.8285909295082092, 0.8643139600753784, 0.9000369906425476, 0.9357600212097168, 0.9714831113815308, 1.0072062015533447, 1.0429291725158691, 1.078652262687683, 1.114375352859497, 1.1500983238220215]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 7.0, 12.0, 15.0, 10.0, 18.0, 16.0, 22.0, 33.0, 27.0, 33.0, 35.0, 31.0, 43.0, 38.0, 42.0, 53.0, 41.0, 45.0, 34.0, 35.0, 44.0, 37.0, 33.0, 36.0, 36.0, 33.0, 33.0, 28.0, 17.0, 22.0, 16.0, 11.0, 10.0, 9.0, 8.0, 6.0, 8.0, 3.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.038323998451233, -1.0054484605789185, -0.9725730419158936, -0.9396975040435791, -0.9068220257759094, -0.8739465475082397, -0.8410710692405701, -0.8081955909729004, -0.7753200531005859, -0.7424445748329163, -0.7095690965652466, -0.6766935586929321, -0.6438180804252625, -0.6109426021575928, -0.5780671238899231, -0.5451916456222534, -0.5123161673545837, -0.47944068908691406, -0.446565181016922, -0.4136897027492523, -0.38081419467926025, -0.3479387164115906, -0.3150632381439209, -0.2821877598762512, -0.24931225180625916, -0.21643675863742828, -0.1835612654685974, -0.15068578720092773, -0.11781029403209686, -0.08493480086326599, -0.052059322595596313, -0.019183829426765442, 0.01369166374206543, 0.046567153185606, 0.07944264262914658, 0.11231812834739685, 0.14519362151622772, 0.1780691146850586, 0.21094459295272827, 0.24382008612155914, 0.27669557929039, 0.3095710575580597, 0.34244656562805176, 0.37532204389572144, 0.4081975221633911, 0.4410730302333832, 0.47394850850105286, 0.5068240165710449, 0.5396994948387146, 0.5725749731063843, 0.605450451374054, 0.6383259296417236, 0.6712014675140381, 0.7040769457817078, 0.7369524240493774, 0.7698279023170471, 0.8027033805847168, 0.8355788588523865, 0.8684543371200562, 0.9013298749923706, 0.9342053532600403, 0.96708083152771, 0.9999563097953796, 1.0328317880630493, 1.0657073259353638]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 13.0, 10.0, 35.0, 33.0, 61.0, 67.0, 140.0, 189.0, 308.0, 518.0, 817.0, 1574.0, 3142.0, 6121.0, 12226.0, 25384.0, 56918.0, 140863.0, 340984.0, 271681.0, 103801.0, 43560.0, 19745.0, 9874.0, 4828.0, 2519.0, 1275.0, 764.0, 391.0, 245.0, 168.0, 113.0, 60.0, 36.0, 29.0, 19.0, 9.0, 8.0, 9.0, 1.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5966796875, -1.5449066162109375, -1.493133544921875, -1.4413604736328125, -1.38958740234375, -1.3378143310546875, -1.286041259765625, -1.2342681884765625, -1.1824951171875, -1.1307220458984375, -1.078948974609375, -1.0271759033203125, -0.97540283203125, -0.9236297607421875, -0.871856689453125, -0.8200836181640625, -0.768310546875, -0.7165374755859375, -0.664764404296875, -0.6129913330078125, -0.56121826171875, -0.5094451904296875, -0.457672119140625, -0.4058990478515625, -0.3541259765625, -0.3023529052734375, -0.250579833984375, -0.1988067626953125, -0.14703369140625, -0.0952606201171875, -0.043487548828125, 0.0082855224609375, 0.06005859375, 0.1118316650390625, 0.163604736328125, 0.2153778076171875, 0.26715087890625, 0.3189239501953125, 0.370697021484375, 0.4224700927734375, 0.4742431640625, 0.5260162353515625, 0.577789306640625, 0.6295623779296875, 0.68133544921875, 0.7331085205078125, 0.784881591796875, 0.8366546630859375, 0.888427734375, 0.9402008056640625, 0.991973876953125, 1.0437469482421875, 1.09552001953125, 1.1472930908203125, 1.199066162109375, 1.2508392333984375, 1.3026123046875, 1.3543853759765625, 1.406158447265625, 1.4579315185546875, 1.50970458984375, 1.5614776611328125, 1.613250732421875, 1.6650238037109375, 1.716796875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 5.0, 5.0, 5.0, 7.0, 11.0, 17.0, 16.0, 23.0, 26.0, 25.0, 28.0, 27.0, 39.0, 30.0, 45.0, 20.0, 45.0, 40.0, 42.0, 38.0, 27.0, 41.0, 45.0, 35.0, 39.0, 37.0, 28.0, 27.0, 30.0, 18.0, 28.0, 22.0, 25.0, 20.0, 10.0, 17.0, 12.0, 9.0, 5.0, 7.0, 5.0, 4.0, 2.0, 1.0, 7.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5546875, -1.5033721923828125, -1.452056884765625, -1.4007415771484375, -1.34942626953125, -1.2981109619140625, -1.246795654296875, -1.1954803466796875, -1.1441650390625, -1.0928497314453125, -1.041534423828125, -0.9902191162109375, -0.93890380859375, -0.8875885009765625, -0.836273193359375, -0.7849578857421875, -0.733642578125, -0.6823272705078125, -0.631011962890625, -0.5796966552734375, -0.52838134765625, -0.4770660400390625, -0.425750732421875, -0.3744354248046875, -0.3231201171875, -0.2718048095703125, -0.220489501953125, -0.1691741943359375, -0.11785888671875, -0.0665435791015625, -0.015228271484375, 0.0360870361328125, 0.08740234375, 0.1387176513671875, 0.190032958984375, 0.2413482666015625, 0.29266357421875, 0.3439788818359375, 0.395294189453125, 0.4466094970703125, 0.4979248046875, 0.5492401123046875, 0.600555419921875, 0.6518707275390625, 0.70318603515625, 0.7545013427734375, 0.805816650390625, 0.8571319580078125, 0.908447265625, 0.9597625732421875, 1.011077880859375, 1.0623931884765625, 1.11370849609375, 1.1650238037109375, 1.216339111328125, 1.2676544189453125, 1.3189697265625, 1.3702850341796875, 1.421600341796875, 1.4729156494140625, 1.52423095703125, 1.5755462646484375, 1.626861572265625, 1.6781768798828125, 1.7294921875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 9.0, 14.0, 21.0, 35.0, 45.0, 73.0, 114.0, 163.0, 286.0, 502.0, 911.0, 1636.0, 3043.0, 6006.0, 11964.0, 25472.0, 57665.0, 146688.0, 356169.0, 263354.0, 97119.0, 39954.0, 18445.0, 9011.0, 4506.0, 2303.0, 1293.0, 718.0, 405.0, 251.0, 151.0, 87.0, 46.0, 32.0, 32.0, 9.0, 16.0, 6.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7421875, -1.692108154296875, -1.64202880859375, -1.591949462890625, -1.5418701171875, -1.491790771484375, -1.44171142578125, -1.391632080078125, -1.341552734375, -1.291473388671875, -1.24139404296875, -1.191314697265625, -1.1412353515625, -1.091156005859375, -1.04107666015625, -0.990997314453125, -0.94091796875, -0.890838623046875, -0.84075927734375, -0.790679931640625, -0.7406005859375, -0.690521240234375, -0.64044189453125, -0.590362548828125, -0.540283203125, -0.490203857421875, -0.44012451171875, -0.390045166015625, -0.3399658203125, -0.289886474609375, -0.23980712890625, -0.189727783203125, -0.1396484375, -0.089569091796875, -0.03948974609375, 0.010589599609375, 0.0606689453125, 0.110748291015625, 0.16082763671875, 0.210906982421875, 0.260986328125, 0.311065673828125, 0.36114501953125, 0.411224365234375, 0.4613037109375, 0.511383056640625, 0.56146240234375, 0.611541748046875, 0.66162109375, 0.711700439453125, 0.76177978515625, 0.811859130859375, 0.8619384765625, 0.912017822265625, 0.96209716796875, 1.012176513671875, 1.062255859375, 1.112335205078125, 1.16241455078125, 1.212493896484375, 1.2625732421875, 1.312652587890625, 1.36273193359375, 1.412811279296875, 1.462890625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 5.0, 6.0, 5.0, 9.0, 8.0, 10.0, 20.0, 13.0, 17.0, 27.0, 34.0, 38.0, 35.0, 38.0, 47.0, 43.0, 59.0, 59.0, 61.0, 58.0, 36.0, 48.0, 56.0, 54.0, 31.0, 32.0, 22.0, 29.0, 22.0, 16.0, 22.0, 11.0, 10.0, 11.0, 5.0, 6.0, 1.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.67578125, -2.5816650390625, -2.487548828125, -2.3934326171875, -2.29931640625, -2.2052001953125, -2.111083984375, -2.0169677734375, -1.9228515625, -1.8287353515625, -1.734619140625, -1.6405029296875, -1.54638671875, -1.4522705078125, -1.358154296875, -1.2640380859375, -1.169921875, -1.0758056640625, -0.981689453125, -0.8875732421875, -0.79345703125, -0.6993408203125, -0.605224609375, -0.5111083984375, -0.4169921875, -0.3228759765625, -0.228759765625, -0.1346435546875, -0.04052734375, 0.0535888671875, 0.147705078125, 0.2418212890625, 0.3359375, 0.4300537109375, 0.524169921875, 0.6182861328125, 0.71240234375, 0.8065185546875, 0.900634765625, 0.9947509765625, 1.0888671875, 1.1829833984375, 1.277099609375, 1.3712158203125, 1.46533203125, 1.5594482421875, 1.653564453125, 1.7476806640625, 1.841796875, 1.9359130859375, 2.030029296875, 2.1241455078125, 2.21826171875, 2.3123779296875, 2.406494140625, 2.5006103515625, 2.5947265625, 2.6888427734375, 2.782958984375, 2.8770751953125, 2.97119140625, 3.0653076171875, 3.159423828125, 3.2535400390625, 3.34765625]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 1.0, 6.0, 8.0, 15.0, 20.0, 25.0, 41.0, 69.0, 84.0, 158.0, 269.0, 368.0, 632.0, 981.0, 1531.0, 2562.0, 4242.0, 7028.0, 12027.0, 20825.0, 36561.0, 67082.0, 123531.0, 202302.0, 228087.0, 150137.0, 83717.0, 44882.0, 25039.0, 14684.0, 8434.0, 5078.0, 3133.0, 1856.0, 1143.0, 733.0, 447.0, 290.0, 171.0, 125.0, 81.0, 47.0, 44.0, 27.0, 18.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3154296875, -0.30562591552734375, -0.2958221435546875, -0.28601837158203125, -0.276214599609375, -0.26641082763671875, -0.2566070556640625, -0.24680328369140625, -0.23699951171875, -0.22719573974609375, -0.2173919677734375, -0.20758819580078125, -0.197784423828125, -0.18798065185546875, -0.1781768798828125, -0.16837310791015625, -0.1585693359375, -0.14876556396484375, -0.1389617919921875, -0.12915802001953125, -0.119354248046875, -0.10955047607421875, -0.0997467041015625, -0.08994293212890625, -0.08013916015625, -0.07033538818359375, -0.0605316162109375, -0.05072784423828125, -0.040924072265625, -0.03112030029296875, -0.0213165283203125, -0.01151275634765625, -0.001708984375, 0.00809478759765625, 0.0178985595703125, 0.02770233154296875, 0.037506103515625, 0.04730987548828125, 0.0571136474609375, 0.06691741943359375, 0.07672119140625, 0.08652496337890625, 0.0963287353515625, 0.10613250732421875, 0.115936279296875, 0.12574005126953125, 0.1355438232421875, 0.14534759521484375, 0.1551513671875, 0.16495513916015625, 0.1747589111328125, 0.18456268310546875, 0.194366455078125, 0.20417022705078125, 0.2139739990234375, 0.22377777099609375, 0.23358154296875, 0.24338531494140625, 0.2531890869140625, 0.26299285888671875, 0.272796630859375, 0.28260040283203125, 0.2924041748046875, 0.30220794677734375, 0.31201171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 7.0, 7.0, 7.0, 13.0, 6.0, 10.0, 23.0, 22.0, 41.0, 43.0, 57.0, 57.0, 93.0, 92.0, 93.0, 79.0, 77.0, 49.0, 36.0, 36.0, 39.0, 19.0, 22.0, 12.0, 17.0, 5.0, 10.0, 6.0, 1.0, 5.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0001442432403564453, -0.00014044996351003647, -0.00013665668666362762, -0.00013286340981721878, -0.00012907013297080994, -0.0001252768561244011, -0.00012148357927799225, -0.0001176903024315834, -0.00011389702558517456, -0.00011010374873876572, -0.00010631047189235687, -0.00010251719504594803, -9.872391819953918e-05, -9.493064135313034e-05, -9.11373645067215e-05, -8.734408766031265e-05, -8.355081081390381e-05, -7.975753396749496e-05, -7.596425712108612e-05, -7.217098027467728e-05, -6.837770342826843e-05, -6.458442658185959e-05, -6.0791149735450745e-05, -5.69978728890419e-05, -5.320459604263306e-05, -4.941131919622421e-05, -4.561804234981537e-05, -4.1824765503406525e-05, -3.803148865699768e-05, -3.423821181058884e-05, -3.0444934964179993e-05, -2.665165811777115e-05, -2.2858381271362305e-05, -1.906510442495346e-05, -1.5271827578544617e-05, -1.1478550732135773e-05, -7.685273885726929e-06, -3.891997039318085e-06, -9.872019290924072e-08, 3.6945566534996033e-06, 7.487833499908447e-06, 1.1281110346317291e-05, 1.5074387192726135e-05, 1.886766403913498e-05, 2.2660940885543823e-05, 2.6454217731952667e-05, 3.024749457836151e-05, 3.4040771424770355e-05, 3.78340482711792e-05, 4.162732511758804e-05, 4.542060196399689e-05, 4.921387881040573e-05, 5.3007155656814575e-05, 5.680043250322342e-05, 6.059370934963226e-05, 6.438698619604111e-05, 6.818026304244995e-05, 7.19735398888588e-05, 7.576681673526764e-05, 7.956009358167648e-05, 8.335337042808533e-05, 8.714664727449417e-05, 9.093992412090302e-05, 9.473320096731186e-05, 9.85264778137207e-05]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 6.0, 18.0, 17.0, 23.0, 22.0, 49.0, 75.0, 89.0, 150.0, 236.0, 364.0, 617.0, 954.0, 1890.0, 3515.0, 7106.0, 14854.0, 33763.0, 80647.0, 194683.0, 349000.0, 206932.0, 86155.0, 35598.0, 15869.0, 7485.0, 3777.0, 1991.0, 1031.0, 605.0, 347.0, 213.0, 125.0, 100.0, 76.0, 60.0, 36.0, 18.0, 19.0, 13.0, 10.0, 3.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51171875, -0.4959907531738281, -0.48026275634765625, -0.4645347595214844, -0.4488067626953125, -0.4330787658691406, -0.41735076904296875, -0.4016227722167969, -0.385894775390625, -0.3701667785644531, -0.35443878173828125, -0.3387107849121094, -0.3229827880859375, -0.3072547912597656, -0.29152679443359375, -0.2757987976074219, -0.26007080078125, -0.24434280395507812, -0.22861480712890625, -0.21288681030273438, -0.1971588134765625, -0.18143081665039062, -0.16570281982421875, -0.14997482299804688, -0.134246826171875, -0.11851882934570312, -0.10279083251953125, -0.08706283569335938, -0.0713348388671875, -0.055606842041015625, -0.03987884521484375, -0.024150848388671875, -0.0084228515625, 0.007305145263671875, 0.02303314208984375, 0.038761138916015625, 0.0544891357421875, 0.07021713256835938, 0.08594512939453125, 0.10167312622070312, 0.117401123046875, 0.13312911987304688, 0.14885711669921875, 0.16458511352539062, 0.1803131103515625, 0.19604110717773438, 0.21176910400390625, 0.22749710083007812, 0.24322509765625, 0.2589530944824219, 0.27468109130859375, 0.2904090881347656, 0.3061370849609375, 0.3218650817871094, 0.33759307861328125, 0.3533210754394531, 0.369049072265625, 0.3847770690917969, 0.40050506591796875, 0.4162330627441406, 0.4319610595703125, 0.4476890563964844, 0.46341705322265625, 0.4791450500488281, 0.494873046875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 4.0, 2.0, 3.0, 3.0, 6.0, 7.0, 8.0, 8.0, 10.0, 18.0, 8.0, 14.0, 21.0, 26.0, 41.0, 51.0, 55.0, 67.0, 69.0, 77.0, 58.0, 73.0, 65.0, 69.0, 45.0, 37.0, 34.0, 29.0, 17.0, 20.0, 11.0, 11.0, 6.0, 10.0, 7.0, 2.0, 2.0, 5.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.347412109375, -0.3375434875488281, -0.32767486572265625, -0.3178062438964844, -0.3079376220703125, -0.2980690002441406, -0.28820037841796875, -0.2783317565917969, -0.268463134765625, -0.2585945129394531, -0.24872589111328125, -0.23885726928710938, -0.2289886474609375, -0.21912002563476562, -0.20925140380859375, -0.19938278198242188, -0.18951416015625, -0.17964553833007812, -0.16977691650390625, -0.15990829467773438, -0.1500396728515625, -0.14017105102539062, -0.13030242919921875, -0.12043380737304688, -0.110565185546875, -0.10069656372070312, -0.09082794189453125, -0.08095932006835938, -0.0710906982421875, -0.061222076416015625, -0.05135345458984375, -0.041484832763671875, -0.0316162109375, -0.021747589111328125, -0.01187896728515625, -0.002010345458984375, 0.0078582763671875, 0.017726898193359375, 0.02759552001953125, 0.037464141845703125, 0.047332763671875, 0.057201385498046875, 0.06707000732421875, 0.07693862915039062, 0.0868072509765625, 0.09667587280273438, 0.10654449462890625, 0.11641311645507812, 0.12628173828125, 0.13615036010742188, 0.14601898193359375, 0.15588760375976562, 0.1657562255859375, 0.17562484741210938, 0.18549346923828125, 0.19536209106445312, 0.205230712890625, 0.21509933471679688, 0.22496795654296875, 0.23483657836914062, 0.2447052001953125, 0.2545738220214844, 0.26444244384765625, 0.2743110656738281, 0.2841796875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 9.0, 18.0, 25.0, 39.0, 71.0, 113.0, 134.0, 175.0, 132.0, 109.0, 86.0, 53.0, 23.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-8.450699806213379, -8.231928825378418, -8.013157844543457, -7.794387340545654, -7.575616359710693, -7.356845378875732, -7.13807487487793, -6.919303894042969, -6.700532913208008, -6.481761932373047, -6.262990951538086, -6.044220447540283, -5.825449466705322, -5.606678485870361, -5.387907981872559, -5.169137001037598, -4.950366020202637, -4.731595039367676, -4.512824058532715, -4.294053554534912, -4.075282573699951, -3.8565115928649902, -3.6377408504486084, -3.4189701080322266, -3.2001991271972656, -2.9814281463623047, -2.762657403945923, -2.543886661529541, -2.32511568069458, -2.106344699859619, -1.8875739574432373, -1.668803095817566, -1.4500317573547363, -1.231260895729065, -1.0124900341033936, -0.7937191724777222, -0.5749483108520508, -0.3561774492263794, -0.137406587600708, 0.08136427402496338, 0.30013513565063477, 0.5189059972763062, 0.7376768589019775, 0.9564477205276489, 1.1752185821533203, 1.3939894437789917, 1.612760305404663, 1.8315311670303345, 2.050302028656006, 2.269073009490967, 2.4878437519073486, 2.7066144943237305, 2.9253854751586914, 3.1441564559936523, 3.362927198410034, 3.581697940826416, 3.800468921661377, 4.019239902496338, 4.238010406494141, 4.456781387329102, 4.6755523681640625, 4.894323348999023, 5.113094329833984, 5.331864833831787, 5.550635814666748]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 8.0, 9.0, 12.0, 14.0, 13.0, 17.0, 22.0, 26.0, 26.0, 23.0, 37.0, 43.0, 37.0, 52.0, 49.0, 36.0, 46.0, 53.0, 42.0, 53.0, 44.0, 34.0, 40.0, 31.0, 26.0, 21.0, 33.0, 26.0, 26.0, 24.0, 20.0, 12.0, 10.0, 7.0, 3.0, 4.0, 4.0, 1.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.492680549621582, -5.3330488204956055, -5.173417091369629, -5.013785362243652, -4.854153633117676, -4.694521427154541, -4.5348896980285645, -4.375257968902588, -4.215626239776611, -4.055994510650635, -3.896362781524658, -3.7367308139801025, -3.577099084854126, -3.4174673557281494, -3.2578353881835938, -3.098203659057617, -2.9385719299316406, -2.778940200805664, -2.6193084716796875, -2.459676504135132, -2.3000447750091553, -2.1404130458831787, -1.9807811975479126, -1.8211493492126465, -1.66151762008667, -1.5018858909606934, -1.3422540426254272, -1.1826221942901611, -1.0229904651641846, -0.8633586764335632, -0.7037268877029419, -0.5440950393676758, -0.3844637870788574, -0.22483199834823608, -0.06520020961761475, 0.09443157911300659, 0.25406336784362793, 0.41369515657424927, 0.5733269453048706, 0.7329587936401367, 0.8925905227661133, 1.0522222518920898, 1.211854100227356, 1.371485948562622, 1.5311176776885986, 1.6907494068145752, 1.8503812551498413, 2.0100131034851074, 2.169644832611084, 2.3292765617370605, 2.488908290863037, 2.6485402584075928, 2.8081719875335693, 2.967803716659546, 3.1274356842041016, 3.287067413330078, 3.4466991424560547, 3.6063308715820312, 3.765962600708008, 3.9255945682525635, 4.085226058959961, 4.244858264923096, 4.404489994049072, 4.564121723175049, 4.723753452301025]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 4.0, 2.0, 4.0, 7.0, 17.0, 19.0, 25.0, 32.0, 44.0, 43.0, 85.0, 126.0, 192.0, 283.0, 432.0, 595.0, 969.0, 1495.0, 1970.0, 3302.0, 1030856.0, 3446.0, 2166.0, 1477.0, 1016.0, 668.0, 431.0, 266.0, 203.0, 123.0, 100.0, 71.0, 42.0, 23.0, 20.0, 15.0, 13.0, 6.0, 8.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.910651206970215, -5.729031085968018, -5.54741096496582, -5.365791320800781, -5.184171199798584, -5.002551078796387, -4.8209309577941895, -4.639310836791992, -4.457691192626953, -4.276071071624756, -4.094450950622559, -3.9128310680389404, -3.7312111854553223, -3.549591064453125, -3.3679709434509277, -3.1863508224487305, -3.004730701446533, -2.823110580444336, -2.6414906978607178, -2.4598705768585205, -2.2782506942749023, -2.096630573272705, -1.9150104522705078, -1.7333904504776, -1.5517704486846924, -1.3701504468917847, -1.188530445098877, -1.0069103240966797, -0.825290322303772, -0.6436703205108643, -0.462050199508667, -0.2804301977157593, -0.09881019592285156, 0.08280983567237854, 0.26442986726760864, 0.44604992866516113, 0.6276699304580688, 0.8092899322509766, 0.9909100532531738, 1.1725300550460815, 1.3541500568389893, 1.535770058631897, 1.7173900604248047, 1.899010181427002, 2.080630302429199, 2.2622501850128174, 2.4438703060150146, 2.625490188598633, 2.80711030960083, 2.9887304306030273, 3.1703503131866455, 3.3519704341888428, 3.533590316772461, 3.715210437774658, 3.8968305587768555, 4.078450679779053, 4.26007080078125, 4.441690921783447, 4.6233110427856445, 4.804930686950684, 4.986550807952881, 5.168170928955078, 5.349791049957275, 5.531411170959473, 5.713030815124512]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 7.0, 1.0, 11.0, 12.0, 14.0, 34.0, 107.0, 158.0, 318.0, 1182.0, 5324.0, 32747.0, 51411452.0, 15596.0, 3159.0, 740.0, 228.0, 101.0, 63.0, 24.0, 20.0, 13.0, 8.0, 6.0, 2.0, 3.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.699848175048828, -18.13774871826172, -17.575647354125977, -17.013547897338867, -16.451446533203125, -15.8893461227417, -15.327245712280273, -14.765146255493164, -14.203044891357422, -13.640944480895996, -13.07884407043457, -12.516743659973145, -11.954643249511719, -11.392542839050293, -10.830442428588867, -10.268342971801758, -9.706242561340332, -9.144142150878906, -8.58204174041748, -8.019941329956055, -7.457840919494629, -6.895740509033203, -6.3336405754089355, -5.77154016494751, -5.209439754486084, -4.647339344024658, -4.085238933563232, -3.5231387615203857, -2.96103835105896, -2.398937940597534, -1.8368377685546875, -1.2747373580932617, -0.7126369476318359, -0.15053659677505493, 0.4115637540817261, 0.9736640453338623, 1.535764455795288, 2.097864866256714, 2.6599650382995605, 3.2220654487609863, 3.784165859222412, 4.346266269683838, 4.908366680145264, 5.470466613769531, 6.032567024230957, 6.594667434692383, 7.156767845153809, 7.718868255615234, 8.28096866607666, 8.843069076538086, 9.405169486999512, 9.967269897460938, 10.529370307922363, 11.091470718383789, 11.653570175170898, 12.21567153930664, 12.77777099609375, 13.339871406555176, 13.901971817016602, 14.464072227478027, 15.026172637939453, 15.588273048400879, 16.150373458862305, 16.712472915649414, 17.274574279785156]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 5.0, 2.0, 6.0, 5.0, 6.0, 11.0, 14.0, 27.0, 28.0, 25.0, 54.0, 66.0, 85.0, 136.0, 208.0, 307.0, 436.0, 696.0, 1023.0, 1654.0, 2763.0, 4689.0, 7614.0, 13185.0, 22819.0, 41072.0, 75037.0, 139334.0, 265750.0, 496416.0, 3871275.0, 609954.0, 343609.0, 179963.0, 94550.0, 50867.0, 28105.0, 15969.0, 9247.0, 5568.0, 3333.0, 2071.0, 1281.0, 816.0, 511.0, 282.0, 216.0, 127.0, 65.0, 54.0, 27.0, 14.0, 25.0, 14.0, 5.0, 12.0, 5.0, 3.0, 2.0, 3.0, 2.0], "bins": [-0.146728515625, -0.14237403869628906, -0.13801956176757812, -0.1336650848388672, -0.12931060791015625, -0.12495613098144531, -0.12060165405273438, -0.11624717712402344, -0.1118927001953125, -0.10753822326660156, -0.10318374633789062, -0.09882926940917969, -0.09447479248046875, -0.09012031555175781, -0.08576583862304688, -0.08141136169433594, -0.077056884765625, -0.07270240783691406, -0.06834793090820312, -0.06399345397949219, -0.05963897705078125, -0.05528450012207031, -0.050930023193359375, -0.04657554626464844, -0.0422210693359375, -0.03786659240722656, -0.033512115478515625, -0.029157638549804688, -0.02480316162109375, -0.020448684692382812, -0.016094207763671875, -0.011739730834960938, -0.00738525390625, -0.0030307769775390625, 0.001323699951171875, 0.0056781768798828125, 0.01003265380859375, 0.014387130737304688, 0.018741607666015625, 0.023096084594726562, 0.0274505615234375, 0.03180503845214844, 0.036159515380859375, 0.04051399230957031, 0.04486846923828125, 0.04922294616699219, 0.053577423095703125, 0.05793190002441406, 0.062286376953125, 0.06664085388183594, 0.07099533081054688, 0.07534980773925781, 0.07970428466796875, 0.08405876159667969, 0.08841323852539062, 0.09276771545410156, 0.0971221923828125, 0.10147666931152344, 0.10583114624023438, 0.11018562316894531, 0.11454010009765625, 0.11889457702636719, 0.12324905395507812, 0.12760353088378906, 0.1319580078125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 4.0, 2.0, 7.0, 6.0, 13.0, 13.0, 16.0, 22.0, 28.0, 20.0, 24.0, 34.0, 30.0, 41.0, 46.0, 36.0, 38.0, 38.0, 42.0, 1055.0, 40.0, 44.0, 44.0, 34.0, 42.0, 36.0, 39.0, 28.0, 39.0, 29.0, 21.0, 18.0, 22.0, 16.0, 10.0, 13.0, 4.0, 8.0, 4.0, 3.0, 1.0, 6.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-8.6484375, -8.38037109375, -8.1123046875, -7.84423828125, -7.576171875, -7.30810546875, -7.0400390625, -6.77197265625, -6.50390625, -6.23583984375, -5.9677734375, -5.69970703125, -5.431640625, -5.16357421875, -4.8955078125, -4.62744140625, -4.359375, -4.09130859375, -3.8232421875, -3.55517578125, -3.287109375, -3.01904296875, -2.7509765625, -2.48291015625, -2.21484375, -1.94677734375, -1.6787109375, -1.41064453125, -1.142578125, -0.87451171875, -0.6064453125, -0.33837890625, -0.0703125, 0.19775390625, 0.4658203125, 0.73388671875, 1.001953125, 1.27001953125, 1.5380859375, 1.80615234375, 2.07421875, 2.34228515625, 2.6103515625, 2.87841796875, 3.146484375, 3.41455078125, 3.6826171875, 3.95068359375, 4.21875, 4.48681640625, 4.7548828125, 5.02294921875, 5.291015625, 5.55908203125, 5.8271484375, 6.09521484375, 6.36328125, 6.63134765625, 6.8994140625, 7.16748046875, 7.435546875, 7.70361328125, 7.9716796875, 8.23974609375, 8.5078125]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 3.0, 11.0, 1.0, 4.0, 9.0, 19.0, 30.0, 48.0, 60.0, 116.0, 143.0, 250.0, 358.0, 531.0, 805.0, 1222.0, 2570.0, 6687.0, 22855.0, 89944.0, 433485.0, 4693817.0, 818634.0, 163260.0, 38451.0, 10527.0, 3376.0, 1609.0, 896.0, 546.0, 379.0, 254.0, 131.0, 110.0, 71.0, 57.0, 39.0, 41.0, 15.0, 17.0, 6.0, 14.0, 8.0, 3.0, 10.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.27587890625, -0.26815032958984375, -0.2604217529296875, -0.25269317626953125, -0.244964599609375, -0.23723602294921875, -0.2295074462890625, -0.22177886962890625, -0.21405029296875, -0.20632171630859375, -0.1985931396484375, -0.19086456298828125, -0.183135986328125, -0.17540740966796875, -0.1676788330078125, -0.15995025634765625, -0.1522216796875, -0.14449310302734375, -0.1367645263671875, -0.12903594970703125, -0.121307373046875, -0.11357879638671875, -0.1058502197265625, -0.09812164306640625, -0.09039306640625, -0.08266448974609375, -0.0749359130859375, -0.06720733642578125, -0.059478759765625, -0.05175018310546875, -0.0440216064453125, -0.03629302978515625, -0.028564453125, -0.02083587646484375, -0.0131072998046875, -0.00537872314453125, 0.002349853515625, 0.01007843017578125, 0.0178070068359375, 0.02553558349609375, 0.03326416015625, 0.04099273681640625, 0.0487213134765625, 0.05644989013671875, 0.064178466796875, 0.07190704345703125, 0.0796356201171875, 0.08736419677734375, 0.0950927734375, 0.10282135009765625, 0.1105499267578125, 0.11827850341796875, 0.126007080078125, 0.13373565673828125, 0.1414642333984375, 0.14919281005859375, 0.15692138671875, 0.16464996337890625, 0.1723785400390625, 0.18010711669921875, 0.187835693359375, 0.19556427001953125, 0.2032928466796875, 0.21102142333984375, 0.21875]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 5.0, 6.0, 8.0, 10.0, 18.0, 8.0, 17.0, 13.0, 26.0, 23.0, 27.0, 26.0, 36.0, 34.0, 49.0, 44.0, 66.0, 53.0, 24.0, 1069.0, 42.0, 50.0, 51.0, 41.0, 38.0, 36.0, 28.0, 26.0, 22.0, 26.0, 26.0, 15.0, 15.0, 13.0, 9.0, 5.0, 6.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.73046875, -6.51715087890625, -6.3038330078125, -6.09051513671875, -5.877197265625, -5.66387939453125, -5.4505615234375, -5.23724365234375, -5.02392578125, -4.81060791015625, -4.5972900390625, -4.38397216796875, -4.170654296875, -3.95733642578125, -3.7440185546875, -3.53070068359375, -3.3173828125, -3.10406494140625, -2.8907470703125, -2.67742919921875, -2.464111328125, -2.25079345703125, -2.0374755859375, -1.82415771484375, -1.61083984375, -1.39752197265625, -1.1842041015625, -0.97088623046875, -0.757568359375, -0.54425048828125, -0.3309326171875, -0.11761474609375, 0.095703125, 0.30902099609375, 0.5223388671875, 0.73565673828125, 0.948974609375, 1.16229248046875, 1.3756103515625, 1.58892822265625, 1.80224609375, 2.01556396484375, 2.2288818359375, 2.44219970703125, 2.655517578125, 2.86883544921875, 3.0821533203125, 3.29547119140625, 3.5087890625, 3.72210693359375, 3.9354248046875, 4.14874267578125, 4.362060546875, 4.57537841796875, 4.7886962890625, 5.00201416015625, 5.21533203125, 5.42864990234375, 5.6419677734375, 5.85528564453125, 6.068603515625, 6.28192138671875, 6.4952392578125, 6.70855712890625, 6.921875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 12.0, 5.0, 13.0, 17.0, 31.0, 23.0, 27.0, 68.0, 149.0, 237.0, 373.0, 736.0, 1381.0, 3021.0, 10314.0, 177656.0, 6010769.0, 74555.0, 6989.0, 2341.0, 1259.0, 617.0, 331.0, 203.0, 112.0, 44.0, 47.0, 29.0, 11.0, 5.0, 2.0, 10.0, 2.0, 1.0, 6.0, 1.0, 5.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 6.0], "bins": [-0.55908203125, -0.5378952026367188, -0.5167083740234375, -0.49552154541015625, -0.474334716796875, -0.45314788818359375, -0.4319610595703125, -0.41077423095703125, -0.38958740234375, -0.36840057373046875, -0.3472137451171875, -0.32602691650390625, -0.304840087890625, -0.28365325927734375, -0.2624664306640625, -0.24127960205078125, -0.2200927734375, -0.19890594482421875, -0.1777191162109375, -0.15653228759765625, -0.135345458984375, -0.11415863037109375, -0.0929718017578125, -0.07178497314453125, -0.05059814453125, -0.02941131591796875, -0.0082244873046875, 0.01296234130859375, 0.034149169921875, 0.05533599853515625, 0.0765228271484375, 0.09770965576171875, 0.118896484375, 0.14008331298828125, 0.1612701416015625, 0.18245697021484375, 0.203643798828125, 0.22483062744140625, 0.2460174560546875, 0.26720428466796875, 0.28839111328125, 0.30957794189453125, 0.3307647705078125, 0.35195159912109375, 0.373138427734375, 0.39432525634765625, 0.4155120849609375, 0.43669891357421875, 0.4578857421875, 0.47907257080078125, 0.5002593994140625, 0.5214462280273438, 0.542633056640625, 0.5638198852539062, 0.5850067138671875, 0.6061935424804688, 0.62738037109375, 0.6485671997070312, 0.6697540283203125, 0.6909408569335938, 0.712127685546875, 0.7333145141601562, 0.7545013427734375, 0.7756881713867188, 0.796875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 3.0, 13.0, 10.0, 6.0, 14.0, 26.0, 14.0, 26.0, 39.0, 38.0, 34.0, 41.0, 47.0, 47.0, 55.0, 289.0, 838.0, 53.0, 65.0, 57.0, 45.0, 43.0, 32.0, 42.0, 33.0, 29.0, 21.0, 19.0, 21.0, 7.0, 7.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5703125, -4.371826171875, -4.17333984375, -3.974853515625, -3.7763671875, -3.577880859375, -3.37939453125, -3.180908203125, -2.982421875, -2.783935546875, -2.58544921875, -2.386962890625, -2.1884765625, -1.989990234375, -1.79150390625, -1.593017578125, -1.39453125, -1.196044921875, -0.99755859375, -0.799072265625, -0.6005859375, -0.402099609375, -0.20361328125, -0.005126953125, 0.193359375, 0.391845703125, 0.59033203125, 0.788818359375, 0.9873046875, 1.185791015625, 1.38427734375, 1.582763671875, 1.78125, 1.979736328125, 2.17822265625, 2.376708984375, 2.5751953125, 2.773681640625, 2.97216796875, 3.170654296875, 3.369140625, 3.567626953125, 3.76611328125, 3.964599609375, 4.1630859375, 4.361572265625, 4.56005859375, 4.758544921875, 4.95703125, 5.155517578125, 5.35400390625, 5.552490234375, 5.7509765625, 5.949462890625, 6.14794921875, 6.346435546875, 6.544921875, 6.743408203125, 6.94189453125, 7.140380859375, 7.3388671875, 7.537353515625, 7.73583984375, 7.934326171875, 8.1328125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 79.0, 922.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.99751281738281, -55.61835479736328, -54.239200592041016, -52.86004638671875, -51.48088836669922, -50.10173034667969, -48.72257614135742, -47.343421936035156, -45.964263916015625, -44.585105895996094, -43.20595169067383, -41.82679748535156, -40.44763946533203, -39.0684814453125, -37.689327239990234, -36.31017303466797, -34.93101501464844, -33.551856994628906, -32.17270278930664, -30.793546676635742, -29.414390563964844, -28.035234451293945, -26.656078338623047, -25.27692222595215, -23.89776611328125, -22.51861000061035, -21.139453887939453, -19.760297775268555, -18.381141662597656, -17.001985549926758, -15.62282943725586, -14.243673324584961, -12.864517211914062, -11.485361099243164, -10.106204986572266, -8.727048873901367, -7.347892761230469, -5.96873664855957, -4.589580535888672, -3.2104244232177734, -1.831268310546875, -0.45211219787597656, 0.9270439147949219, 2.3062000274658203, 3.6853561401367188, 5.064512252807617, 6.443668365478516, 7.822824478149414, 9.201980590820312, 10.581136703491211, 11.96029281616211, 13.339448928833008, 14.718605041503906, 16.097761154174805, 17.476917266845703, 18.8560733795166, 20.2352294921875, 21.6143856048584, 22.993541717529297, 24.372697830200195, 25.751853942871094, 27.131010055541992, 28.51016616821289, 29.88932228088379, 31.268478393554688]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 21.0, 35.0, 63.0, 105.0, 140.0, 145.0, 154.0, 116.0, 101.0, 54.0, 39.0, 19.0, 9.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-33.09898376464844, -32.30891036987305, -31.51883316040039, -30.728757858276367, -29.938682556152344, -29.14860725402832, -28.358531951904297, -27.568456649780273, -26.77838134765625, -25.988306045532227, -25.198230743408203, -24.40815544128418, -23.618080139160156, -22.828004837036133, -22.03792953491211, -21.247854232788086, -20.457778930664062, -19.66770362854004, -18.877628326416016, -18.087553024291992, -17.29747772216797, -16.507402420043945, -15.717327117919922, -14.927251815795898, -14.137178421020508, -13.347103118896484, -12.557027816772461, -11.766952514648438, -10.976877212524414, -10.18680191040039, -9.396726608276367, -8.606651306152344, -7.81657600402832, -7.026500701904297, -6.236425399780273, -5.44635009765625, -4.656274795532227, -3.8661997318267822, -3.076124668121338, -2.2860493659973145, -1.495974063873291, -0.7058988213539124, 0.08417642116546631, 0.8742516040802002, 1.6643269062042236, 2.454402208328247, 3.2444772720336914, 4.034552574157715, 4.824627876281738, 5.614703178405762, 6.404778480529785, 7.194853782653809, 7.984929084777832, 8.775004386901855, 9.565078735351562, 10.355154037475586, 11.14522933959961, 11.935304641723633, 12.725379943847656, 13.51545524597168, 14.305530548095703, 15.095605850219727, 15.88568115234375, 16.675756454467773, 17.465831756591797]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 6.0, 17.0, 27.0, 45.0, 115.0, 7084.0, 24522.0, 4139769.0, 18877.0, 1142.0, 1294.0, 1339.0, 20.0, 8.0, 5.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.046966552734375, -0.04583334922790527, -0.04470014572143555, -0.04356694221496582, -0.042433738708496094, -0.04130053520202637, -0.04016733169555664, -0.039034128189086914, -0.03790092468261719, -0.03676772117614746, -0.035634517669677734, -0.03450131416320801, -0.03336811065673828, -0.032234907150268555, -0.031101703643798828, -0.0299685001373291, -0.028835296630859375, -0.02770209312438965, -0.026568889617919922, -0.025435686111450195, -0.02430248260498047, -0.023169279098510742, -0.022036075592041016, -0.02090287208557129, -0.019769668579101562, -0.018636465072631836, -0.01750326156616211, -0.016370058059692383, -0.015236854553222656, -0.01410365104675293, -0.012970447540283203, -0.011837244033813477, -0.01070404052734375, -0.009570837020874023, -0.008437633514404297, -0.00730443000793457, -0.006171226501464844, -0.005038022994995117, -0.0039048194885253906, -0.002771615982055664, -0.0016384124755859375, -0.0005052089691162109, 0.0006279945373535156, 0.0017611980438232422, 0.0028944015502929688, 0.004027605056762695, 0.005160808563232422, 0.0062940120697021484, 0.007427215576171875, 0.008560419082641602, 0.009693622589111328, 0.010826826095581055, 0.011960029602050781, 0.013093233108520508, 0.014226436614990234, 0.015359640121459961, 0.016492843627929688, 0.017626047134399414, 0.01875925064086914, 0.019892454147338867, 0.021025657653808594, 0.02215886116027832, 0.023292064666748047, 0.024425268173217773, 0.0255584716796875]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 8.0, 35.0, 56.0, 187.0, 454.0, 162.0, 56.0, 23.0, 12.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.026947021484375, -0.026296377182006836, -0.025645732879638672, -0.024995088577270508, -0.024344444274902344, -0.02369379997253418, -0.023043155670166016, -0.02239251136779785, -0.021741867065429688, -0.021091222763061523, -0.02044057846069336, -0.019789934158325195, -0.01913928985595703, -0.018488645553588867, -0.017838001251220703, -0.01718735694885254, -0.016536712646484375, -0.01588606834411621, -0.015235424041748047, -0.014584779739379883, -0.013934135437011719, -0.013283491134643555, -0.01263284683227539, -0.011982202529907227, -0.011331558227539062, -0.010680913925170898, -0.010030269622802734, -0.00937962532043457, -0.008728981018066406, -0.008078336715698242, -0.007427692413330078, -0.006777048110961914, -0.00612640380859375, -0.005475759506225586, -0.004825115203857422, -0.004174470901489258, -0.0035238265991210938, -0.0028731822967529297, -0.0022225379943847656, -0.0015718936920166016, -0.0009212493896484375, -0.00027060508728027344, 0.0003800392150878906, 0.0010306835174560547, 0.0016813278198242188, 0.002331972122192383, 0.002982616424560547, 0.003633260726928711, 0.004283905029296875, 0.004934549331665039, 0.005585193634033203, 0.006235837936401367, 0.006886482238769531, 0.007537126541137695, 0.00818777084350586, 0.008838415145874023, 0.009489059448242188, 0.010139703750610352, 0.010790348052978516, 0.01144099235534668, 0.012091636657714844, 0.012742280960083008, 0.013392925262451172, 0.014043569564819336, 0.0146942138671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 2.0, 7.0, 4.0, 8.0, 6.0, 10.0, 8.0, 18.0, 49.0, 54.0, 95.0, 264.0, 1655.0, 4188342.0, 3195.0, 291.0, 111.0, 62.0, 21.0, 20.0, 16.0, 16.0, 10.0, 8.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.050811767578125, -0.049202919006347656, -0.04759407043457031, -0.04598522186279297, -0.044376373291015625, -0.04276752471923828, -0.04115867614746094, -0.039549827575683594, -0.03794097900390625, -0.036332130432128906, -0.03472328186035156, -0.03311443328857422, -0.031505584716796875, -0.02989673614501953, -0.028287887573242188, -0.026679039001464844, -0.0250701904296875, -0.023461341857910156, -0.021852493286132812, -0.02024364471435547, -0.018634796142578125, -0.01702594757080078, -0.015417098999023438, -0.013808250427246094, -0.01219940185546875, -0.010590553283691406, -0.008981704711914062, -0.007372856140136719, -0.005764007568359375, -0.004155158996582031, -0.0025463104248046875, -0.0009374618530273438, 0.00067138671875, 0.0022802352905273438, 0.0038890838623046875, 0.005497932434082031, 0.007106781005859375, 0.008715629577636719, 0.010324478149414062, 0.011933326721191406, 0.01354217529296875, 0.015151023864746094, 0.016759872436523438, 0.01836872100830078, 0.019977569580078125, 0.02158641815185547, 0.023195266723632812, 0.024804115295410156, 0.0264129638671875, 0.028021812438964844, 0.029630661010742188, 0.03123950958251953, 0.032848358154296875, 0.03445720672607422, 0.03606605529785156, 0.037674903869628906, 0.03928375244140625, 0.040892601013183594, 0.04250144958496094, 0.04411029815673828, 0.045719146728515625, 0.04732799530029297, 0.04893684387207031, 0.050545692443847656, 0.052154541015625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 8.0, 4.0, 8.0, 5.0, 11.0, 11.0, 17.0, 57.0, 48.0, 109.0, 309.0, 870.0, 1671.0, 532.0, 181.0, 92.0, 49.0, 15.0, 23.0, 13.0, 13.0, 10.0, 8.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01091766357421875, -0.01056969165802002, -0.010221719741821289, -0.009873747825622559, -0.009525775909423828, -0.009177803993225098, -0.008829832077026367, -0.008481860160827637, -0.008133888244628906, -0.007785916328430176, -0.007437944412231445, -0.007089972496032715, -0.006742000579833984, -0.006394028663635254, -0.0060460567474365234, -0.005698084831237793, -0.0053501129150390625, -0.005002140998840332, -0.0046541690826416016, -0.004306197166442871, -0.003958225250244141, -0.00361025333404541, -0.0032622814178466797, -0.0029143095016479492, -0.0025663375854492188, -0.0022183656692504883, -0.0018703937530517578, -0.0015224218368530273, -0.0011744499206542969, -0.0008264780044555664, -0.00047850608825683594, -0.00013053417205810547, 0.000217437744140625, 0.0005654096603393555, 0.0009133815765380859, 0.0012613534927368164, 0.0016093254089355469, 0.0019572973251342773, 0.002305269241333008, 0.0026532411575317383, 0.0030012130737304688, 0.0033491849899291992, 0.0036971569061279297, 0.00404512882232666, 0.004393100738525391, 0.004741072654724121, 0.0050890445709228516, 0.005437016487121582, 0.0057849884033203125, 0.006132960319519043, 0.0064809322357177734, 0.006828904151916504, 0.007176876068115234, 0.007524847984313965, 0.007872819900512695, 0.008220791816711426, 0.008568763732910156, 0.008916735649108887, 0.009264707565307617, 0.009612679481506348, 0.009960651397705078, 0.010308623313903809, 0.010656595230102539, 0.01100456714630127, 0.0113525390625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 538.0, 479.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.043215200304985046, -0.03779290243983269, -0.03237060457468033, -0.02694830670952797, -0.02152600884437561, -0.01610371097922325, -0.010681413114070892, -0.005259115248918533, 0.00016318261623382568, 0.005585480481386185, 0.011007778346538544, 0.016430076211690903, 0.02185237407684326, 0.02727467194199562, 0.03269696980714798, 0.03811926767230034, 0.0435415655374527, 0.04896386340260506, 0.054386161267757416, 0.059808459132909775, 0.06523075699806213, 0.0706530511379242, 0.07607535272836685, 0.08149765431880951, 0.08691994845867157, 0.09234224259853363, 0.09776454418897629, 0.10318684577941895, 0.108609139919281, 0.11403143405914307, 0.11945373564958572, 0.12487603724002838, 0.13029834628105164, 0.1357206404209137, 0.14114293456077576, 0.146565243601799, 0.15198753774166107, 0.15740983188152313, 0.1628321409225464, 0.16825443506240845, 0.1736767292022705, 0.17909902334213257, 0.18452131748199463, 0.18994362652301788, 0.19536592066287994, 0.200788214802742, 0.20621052384376526, 0.21163281798362732, 0.21705511212348938, 0.22247740626335144, 0.2278997004032135, 0.23332200944423676, 0.23874430358409882, 0.24416659772396088, 0.24958890676498413, 0.2550112009048462, 0.26043349504470825, 0.2658557891845703, 0.2712780833244324, 0.27670037746429443, 0.2821226716041565, 0.28754499554634094, 0.292967289686203, 0.29838958382606506, 0.3038118779659271]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 7.0, 4.0, 7.0, 9.0, 15.0, 10.0, 14.0, 21.0, 18.0, 19.0, 25.0, 39.0, 28.0, 30.0, 32.0, 23.0, 30.0, 31.0, 46.0, 36.0, 46.0, 36.0, 42.0, 51.0, 39.0, 37.0, 46.0, 37.0, 25.0, 37.0, 29.0, 25.0, 24.0, 18.0, 14.0, 14.0, 10.0, 7.0, 9.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-0.02069830894470215, -0.020103823393583298, -0.019509335979819298, -0.018914848566055298, -0.018320363014936447, -0.017725877463817596, -0.017131390050053596, -0.016536902636289597, -0.015942417085170746, -0.01534793060272932, -0.014753444120287895, -0.01415895763784647, -0.013564471155405045, -0.01296998467296362, -0.012375498190522194, -0.011781011708080769, -0.011186525225639343, -0.010592038743197918, -0.009997552260756493, -0.009403065778315067, -0.008808579295873642, -0.008214092813432217, -0.007619606330990791, -0.007025119848549366, -0.006430633366107941, -0.005836146883666515, -0.00524166040122509, -0.004647173918783665, -0.004052687436342239, -0.003458200953900814, -0.0028637144714593887, -0.0022692279890179634, -0.001674741506576538, -0.0010802550241351128, -0.00048576854169368744, 0.00010871794074773788, 0.0007032044231891632, 0.0012976909056305885, 0.0018921773880720139, 0.002486663870513439, 0.0030811503529548645, 0.00367563683539629, 0.004270123317837715, 0.0048646098002791405, 0.005459096282720566, 0.006053582765161991, 0.0066480692476034164, 0.007242555730044842, 0.007837042212486267, 0.008431528694927692, 0.009026015177369118, 0.009620501659810543, 0.010214988142251968, 0.010809474624693394, 0.011403961107134819, 0.011998447589576244, 0.01259293407201767, 0.013187420554459095, 0.01378190703690052, 0.014376393519341946, 0.014970880001783371, 0.015565366484224796, 0.01615985296666622, 0.01675434038043022, 0.017348825931549072]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 5.0, 9.0, 12.0, 20.0, 24.0, 43.0, 66.0, 111.0, 179.0, 301.0, 885.0, 4356.0, 269804.0, 766046.0, 4939.0, 951.0, 356.0, 160.0, 70.0, 51.0, 29.0, 25.0, 25.0, 13.0, 12.0, 12.0, 13.0, 9.0, 5.0, 3.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.45703125, -1.4206314086914062, -1.3842315673828125, -1.3478317260742188, -1.311431884765625, -1.2750320434570312, -1.2386322021484375, -1.2022323608398438, -1.16583251953125, -1.1294326782226562, -1.0930328369140625, -1.0566329956054688, -1.020233154296875, -0.9838333129882812, -0.9474334716796875, -0.9110336303710938, -0.8746337890625, -0.8382339477539062, -0.8018341064453125, -0.7654342651367188, -0.729034423828125, -0.6926345825195312, -0.6562347412109375, -0.6198348999023438, -0.58343505859375, -0.5470352172851562, -0.5106353759765625, -0.47423553466796875, -0.437835693359375, -0.40143585205078125, -0.3650360107421875, -0.32863616943359375, -0.292236328125, -0.25583648681640625, -0.2194366455078125, -0.18303680419921875, -0.146636962890625, -0.11023712158203125, -0.0738372802734375, -0.03743743896484375, -0.00103759765625, 0.03536224365234375, 0.0717620849609375, 0.10816192626953125, 0.144561767578125, 0.18096160888671875, 0.2173614501953125, 0.25376129150390625, 0.2901611328125, 0.32656097412109375, 0.3629608154296875, 0.39936065673828125, 0.435760498046875, 0.47216033935546875, 0.5085601806640625, 0.5449600219726562, 0.58135986328125, 0.6177597045898438, 0.6541595458984375, 0.6905593872070312, 0.726959228515625, 0.7633590698242188, 0.7997589111328125, 0.8361587524414062, 0.87255859375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 6.0, 38.0, 55.0, 189.0, 454.0, 159.0, 56.0, 23.0, 12.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.02740478515625, -0.026743173599243164, -0.026081562042236328, -0.025419950485229492, -0.024758338928222656, -0.02409672737121582, -0.023435115814208984, -0.02277350425720215, -0.022111892700195312, -0.021450281143188477, -0.02078866958618164, -0.020127058029174805, -0.01946544647216797, -0.018803834915161133, -0.018142223358154297, -0.01748061180114746, -0.016819000244140625, -0.01615738868713379, -0.015495777130126953, -0.014834165573120117, -0.014172554016113281, -0.013510942459106445, -0.01284933090209961, -0.012187719345092773, -0.011526107788085938, -0.010864496231079102, -0.010202884674072266, -0.00954127311706543, -0.008879661560058594, -0.008218050003051758, -0.007556438446044922, -0.006894826889038086, -0.00623321533203125, -0.005571603775024414, -0.004909992218017578, -0.004248380661010742, -0.0035867691040039062, -0.0029251575469970703, -0.0022635459899902344, -0.0016019344329833984, -0.0009403228759765625, -0.00027871131896972656, 0.0003829002380371094, 0.0010445117950439453, 0.0017061233520507812, 0.002367734909057617, 0.003029346466064453, 0.003690958023071289, 0.004352569580078125, 0.005014181137084961, 0.005675792694091797, 0.006337404251098633, 0.006999015808105469, 0.007660627365112305, 0.00832223892211914, 0.008983850479125977, 0.009645462036132812, 0.010307073593139648, 0.010968685150146484, 0.01163029670715332, 0.012291908264160156, 0.012953519821166992, 0.013615131378173828, 0.014276742935180664, 0.0149383544921875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 8.0, 9.0, 18.0, 21.0, 31.0, 34.0, 48.0, 62.0, 125.0, 189.0, 311.0, 543.0, 973.0, 1821.0, 3324.0, 6480.0, 13453.0, 29070.0, 67770.0, 229096.0, 499611.0, 112966.0, 43756.0, 19319.0, 9334.0, 4646.0, 2407.0, 1284.0, 710.0, 401.0, 284.0, 163.0, 107.0, 59.0, 31.0, 27.0, 16.0, 11.0, 15.0, 11.0, 7.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0275421142578125, -0.02673792839050293, -0.02593374252319336, -0.02512955665588379, -0.02432537078857422, -0.02352118492126465, -0.022716999053955078, -0.021912813186645508, -0.021108627319335938, -0.020304441452026367, -0.019500255584716797, -0.018696069717407227, -0.017891883850097656, -0.017087697982788086, -0.016283512115478516, -0.015479326248168945, -0.014675140380859375, -0.013870954513549805, -0.013066768646240234, -0.012262582778930664, -0.011458396911621094, -0.010654211044311523, -0.009850025177001953, -0.009045839309692383, -0.008241653442382812, -0.007437467575073242, -0.006633281707763672, -0.0058290958404541016, -0.005024909973144531, -0.004220724105834961, -0.0034165382385253906, -0.0026123523712158203, -0.00180816650390625, -0.0010039806365966797, -0.00019979476928710938, 0.0006043910980224609, 0.0014085769653320312, 0.0022127628326416016, 0.003016948699951172, 0.003821134567260742, 0.0046253204345703125, 0.005429506301879883, 0.006233692169189453, 0.0070378780364990234, 0.007842063903808594, 0.008646249771118164, 0.009450435638427734, 0.010254621505737305, 0.011058807373046875, 0.011862993240356445, 0.012667179107666016, 0.013471364974975586, 0.014275550842285156, 0.015079736709594727, 0.015883922576904297, 0.016688108444213867, 0.017492294311523438, 0.018296480178833008, 0.019100666046142578, 0.01990485191345215, 0.02070903778076172, 0.02151322364807129, 0.02231740951538086, 0.02312159538269043, 0.02392578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 5.0, 2.0, 4.0, 5.0, 6.0, 12.0, 23.0, 25.0, 16.0, 28.0, 35.0, 27.0, 45.0, 29.0, 34.0, 42.0, 45.0, 64.0, 44.0, 54.0, 53.0, 50.0, 48.0, 39.0, 43.0, 33.0, 30.0, 22.0, 32.0, 30.0, 15.0, 11.0, 12.0, 7.0, 7.0, 7.0, 4.0, 6.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0136260986328125, -0.013135910034179688, -0.012645721435546875, -0.012155532836914062, -0.01166534423828125, -0.011175155639648438, -0.010684967041015625, -0.010194778442382812, -0.00970458984375, -0.009214401245117188, -0.008724212646484375, -0.008234024047851562, -0.00774383544921875, -0.0072536468505859375, -0.006763458251953125, -0.0062732696533203125, -0.0057830810546875, -0.0052928924560546875, -0.004802703857421875, -0.0043125152587890625, -0.00382232666015625, -0.0033321380615234375, -0.002841949462890625, -0.0023517608642578125, -0.001861572265625, -0.0013713836669921875, -0.000881195068359375, -0.0003910064697265625, 9.918212890625e-05, 0.0005893707275390625, 0.001079559326171875, 0.0015697479248046875, 0.0020599365234375, 0.0025501251220703125, 0.003040313720703125, 0.0035305023193359375, 0.00402069091796875, 0.0045108795166015625, 0.005001068115234375, 0.0054912567138671875, 0.0059814453125, 0.0064716339111328125, 0.006961822509765625, 0.0074520111083984375, 0.00794219970703125, 0.008432388305664062, 0.008922576904296875, 0.009412765502929688, 0.0099029541015625, 0.010393142700195312, 0.010883331298828125, 0.011373519897460938, 0.01186370849609375, 0.012353897094726562, 0.012844085693359375, 0.013334274291992188, 0.013824462890625, 0.014314651489257812, 0.014804840087890625, 0.015295028686523438, 0.01578521728515625, 0.016275405883789062, 0.016765594482421875, 0.017255783081054688, 0.0177459716796875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 11.0, 23.0, 28.0, 52.0, 89.0, 158.0, 290.0, 575.0, 1218.0, 3466.0, 14106.0, 194370.0, 798420.0, 27264.0, 5247.0, 1758.0, 725.0, 337.0, 171.0, 94.0, 66.0, 41.0, 26.0, 9.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00986480712890625, -0.009526610374450684, -0.009188413619995117, -0.00885021686553955, -0.008512020111083984, -0.008173823356628418, -0.007835626602172852, -0.007497429847717285, -0.007159233093261719, -0.006821036338806152, -0.006482839584350586, -0.0061446428298950195, -0.005806446075439453, -0.005468249320983887, -0.00513005256652832, -0.004791855812072754, -0.0044536590576171875, -0.004115462303161621, -0.0037772655487060547, -0.0034390687942504883, -0.003100872039794922, -0.0027626752853393555, -0.002424478530883789, -0.0020862817764282227, -0.0017480850219726562, -0.0014098882675170898, -0.0010716915130615234, -0.000733494758605957, -0.0003952980041503906, -5.710124969482422e-05, 0.0002810955047607422, 0.0006192922592163086, 0.000957489013671875, 0.0012956857681274414, 0.0016338825225830078, 0.0019720792770385742, 0.0023102760314941406, 0.002648472785949707, 0.0029866695404052734, 0.00332486629486084, 0.0036630630493164062, 0.004001259803771973, 0.004339456558227539, 0.0046776533126831055, 0.005015850067138672, 0.005354046821594238, 0.005692243576049805, 0.006030440330505371, 0.0063686370849609375, 0.006706833839416504, 0.00704503059387207, 0.007383227348327637, 0.007721424102783203, 0.00805962085723877, 0.008397817611694336, 0.008736014366149902, 0.009074211120605469, 0.009412407875061035, 0.009750604629516602, 0.010088801383972168, 0.010426998138427734, 0.0107651948928833, 0.011103391647338867, 0.011441588401794434, 0.01177978515625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 7.0, 3.0, 10.0, 10.0, 10.0, 22.0, 38.0, 37.0, 50.0, 69.0, 93.0, 118.0, 126.0, 94.0, 61.0, 74.0, 35.0, 36.0, 27.0, 22.0, 17.0, 6.0, 5.0, 5.0, 2.0, 8.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.555152893066406e-05, -5.3573399782180786e-05, -5.159527063369751e-05, -4.9617141485214233e-05, -4.763901233673096e-05, -4.566088318824768e-05, -4.3682754039764404e-05, -4.170462489128113e-05, -3.972649574279785e-05, -3.7748366594314575e-05, -3.57702374458313e-05, -3.379210829734802e-05, -3.1813979148864746e-05, -2.983585000038147e-05, -2.7857720851898193e-05, -2.5879591703414917e-05, -2.390146255493164e-05, -2.1923333406448364e-05, -1.9945204257965088e-05, -1.796707510948181e-05, -1.5988945960998535e-05, -1.4010816812515259e-05, -1.2032687664031982e-05, -1.0054558515548706e-05, -8.07642936706543e-06, -6.098300218582153e-06, -4.120171070098877e-06, -2.1420419216156006e-06, -1.6391277313232422e-07, 1.8142163753509521e-06, 3.7923455238342285e-06, 5.770474672317505e-06, 7.748603820800781e-06, 9.726732969284058e-06, 1.1704862117767334e-05, 1.368299126625061e-05, 1.5661120414733887e-05, 1.7639249563217163e-05, 1.961737871170044e-05, 2.1595507860183716e-05, 2.3573637008666992e-05, 2.555176615715027e-05, 2.7529895305633545e-05, 2.950802445411682e-05, 3.14861536026001e-05, 3.3464282751083374e-05, 3.544241189956665e-05, 3.742054104804993e-05, 3.93986701965332e-05, 4.137679934501648e-05, 4.3354928493499756e-05, 4.533305764198303e-05, 4.731118679046631e-05, 4.9289315938949585e-05, 5.126744508743286e-05, 5.324557423591614e-05, 5.5223703384399414e-05, 5.720183253288269e-05, 5.917996168136597e-05, 6.115809082984924e-05, 6.313621997833252e-05, 6.51143491268158e-05, 6.709247827529907e-05, 6.907060742378235e-05, 7.104873657226562e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 7.0, 8.0, 9.0, 11.0, 12.0, 22.0, 25.0, 57.0, 96.0, 180.0, 379.0, 933.0, 2838.0, 12197.0, 130015.0, 858277.0, 34632.0, 5916.0, 1678.0, 635.0, 271.0, 140.0, 63.0, 42.0, 27.0, 28.0, 18.0, 7.0, 5.0, 5.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00849151611328125, -0.008236289024353027, -0.007981061935424805, -0.007725834846496582, -0.007470607757568359, -0.007215380668640137, -0.006960153579711914, -0.006704926490783691, -0.006449699401855469, -0.006194472312927246, -0.0059392452239990234, -0.005684018135070801, -0.005428791046142578, -0.0051735639572143555, -0.004918336868286133, -0.00466310977935791, -0.0044078826904296875, -0.004152655601501465, -0.003897428512573242, -0.0036422014236450195, -0.003386974334716797, -0.0031317472457885742, -0.0028765201568603516, -0.002621293067932129, -0.0023660659790039062, -0.0021108388900756836, -0.001855611801147461, -0.0016003847122192383, -0.0013451576232910156, -0.001089930534362793, -0.0008347034454345703, -0.0005794763565063477, -0.000324249267578125, -6.902217864990234e-05, 0.0001862049102783203, 0.00044143199920654297, 0.0006966590881347656, 0.0009518861770629883, 0.001207113265991211, 0.0014623403549194336, 0.0017175674438476562, 0.001972794532775879, 0.0022280216217041016, 0.0024832487106323242, 0.002738475799560547, 0.0029937028884887695, 0.003248929977416992, 0.003504157066345215, 0.0037593841552734375, 0.00401461124420166, 0.004269838333129883, 0.0045250654220581055, 0.004780292510986328, 0.005035519599914551, 0.0052907466888427734, 0.005545973777770996, 0.005801200866699219, 0.006056427955627441, 0.006311655044555664, 0.006566882133483887, 0.006822109222412109, 0.007077336311340332, 0.007332563400268555, 0.007587790489196777, 0.007843017578125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 3.0, 3.0, 5.0, 6.0, 8.0, 15.0, 9.0, 17.0, 19.0, 35.0, 53.0, 89.0, 150.0, 205.0, 141.0, 83.0, 52.0, 29.0, 23.0, 11.0, 9.0, 12.0, 3.0, 5.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004543304443359375, -0.004406869411468506, -0.004270434379577637, -0.004133999347686768, -0.0039975643157958984, -0.0038611292839050293, -0.00372469425201416, -0.003588259220123291, -0.003451824188232422, -0.0033153891563415527, -0.0031789541244506836, -0.0030425190925598145, -0.0029060840606689453, -0.002769649028778076, -0.002633213996887207, -0.002496778964996338, -0.0023603439331054688, -0.0022239089012145996, -0.0020874738693237305, -0.0019510388374328613, -0.0018146038055419922, -0.001678168773651123, -0.001541733741760254, -0.0014052987098693848, -0.0012688636779785156, -0.0011324286460876465, -0.0009959936141967773, -0.0008595585823059082, -0.0007231235504150391, -0.0005866885185241699, -0.0004502534866333008, -0.00031381845474243164, -0.0001773834228515625, -4.094839096069336e-05, 9.548664093017578e-05, 0.00023192167282104492, 0.00036835670471191406, 0.0005047917366027832, 0.0006412267684936523, 0.0007776618003845215, 0.0009140968322753906, 0.0010505318641662598, 0.001186966896057129, 0.001323401927947998, 0.0014598369598388672, 0.0015962719917297363, 0.0017327070236206055, 0.0018691420555114746, 0.0020055770874023438, 0.002142012119293213, 0.002278447151184082, 0.002414882183074951, 0.0025513172149658203, 0.0026877522468566895, 0.0028241872787475586, 0.0029606223106384277, 0.003097057342529297, 0.003233492374420166, 0.003369927406311035, 0.0035063624382019043, 0.0036427974700927734, 0.0037792325019836426, 0.003915667533874512, 0.004052102565765381, 0.00418853759765625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 7.0, 15.0, 41.0, 115.0, 523.0, 253.0, 43.0, 9.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.6856498718261719, -0.6726462244987488, -0.6596425175666809, -0.6466388702392578, -0.6336352229118347, -0.6206315755844116, -0.6076278686523438, -0.5946242213249207, -0.5816205739974976, -0.5686169266700745, -0.5556132197380066, -0.5426095724105835, -0.5296059250831604, -0.5166022777557373, -0.5035985708236694, -0.49059492349624634, -0.47759121656417847, -0.464587539434433, -0.4515838921070099, -0.4385802149772644, -0.4255765676498413, -0.4125728905200958, -0.39956921339035034, -0.38656556606292725, -0.37356188893318176, -0.3605582118034363, -0.3475545644760132, -0.3345508873462677, -0.3215472102165222, -0.3085435628890991, -0.29553988575935364, -0.28253620862960815, -0.26953256130218506, -0.2565288841724396, -0.24352523684501648, -0.230521559715271, -0.2175178974866867, -0.20451423525810242, -0.19151055812835693, -0.17850689589977264, -0.16550324857234955, -0.15249958634376526, -0.13949590921401978, -0.12649224698543549, -0.1134885847568512, -0.1004849225282669, -0.08748125284910202, -0.07447758316993713, -0.061473920941352844, -0.048470254987478256, -0.03546658903360367, -0.02246292307972908, -0.009459257125854492, 0.0035444051027297974, 0.016548074781894684, 0.02955174446105957, 0.04255540668964386, 0.05555907264351845, 0.06856273859739304, 0.08156640827655792, 0.09457007050514221, 0.1075737327337265, 0.12057740241289139, 0.13358107209205627, 0.14658473432064056]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 12.0, 10.0, 22.0, 37.0, 45.0, 61.0, 77.0, 99.0, 101.0, 116.0, 113.0, 77.0, 77.0, 56.0, 35.0, 26.0, 21.0, 6.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14349758625030518, -0.1387193202972412, -0.13394105434417725, -0.12916278839111328, -0.12438452243804932, -0.11960625648498535, -0.11482798308134079, -0.11004971712827682, -0.10527145117521286, -0.1004931852221489, -0.09571491926908493, -0.09093665331602097, -0.0861583799123764, -0.08138011395931244, -0.07660184800624847, -0.07182358205318451, -0.06704531610012054, -0.06226705014705658, -0.057488784193992615, -0.05271051451563835, -0.04793224856257439, -0.04315398260951042, -0.03837571293115616, -0.033597446978092194, -0.02881918102502823, -0.024040915071964264, -0.01926264725625515, -0.01448438037186861, -0.009706113487482071, -0.004927847534418106, -0.000149579718708992, 0.004628688097000122, 0.009406954050064087, 0.014185220934450626, 0.018963487818837166, 0.02374175563454628, 0.028520021587610245, 0.03329828754067421, 0.03807655721902847, 0.04285482317209244, 0.0476330891251564, 0.05241135507822037, 0.05718962103128433, 0.061967890709638596, 0.06674616038799286, 0.07152442634105682, 0.07630269229412079, 0.08108095824718475, 0.08585922420024872, 0.09063749015331268, 0.09541575610637665, 0.10019402205944061, 0.10497228801250458, 0.10975055396556854, 0.1145288273692131, 0.11930709332227707, 0.12408535927534103, 0.1288636326789856, 0.13364189863204956, 0.13842016458511353, 0.1431984305381775, 0.14797669649124146, 0.15275496244430542, 0.15753322839736938, 0.16231149435043335]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 6.0, 5.0, 2.0, 7.0, 15.0, 20.0, 12.0, 21.0, 20.0, 24.0, 40.0, 44.0, 85.0, 221.0, 649.0, 2842.0, 17943.0, 4131835.0, 35362.0, 3602.0, 754.0, 251.0, 157.0, 112.0, 62.0, 68.0, 39.0, 19.0, 15.0, 15.0, 9.0, 5.0, 5.0, 5.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1439208984375, -0.14019393920898438, -0.13646697998046875, -0.13274002075195312, -0.1290130615234375, -0.12528610229492188, -0.12155914306640625, -0.11783218383789062, -0.114105224609375, -0.11037826538085938, -0.10665130615234375, -0.10292434692382812, -0.0991973876953125, -0.09547042846679688, -0.09174346923828125, -0.08801651000976562, -0.08428955078125, -0.08056259155273438, -0.07683563232421875, -0.07310867309570312, -0.0693817138671875, -0.06565475463867188, -0.06192779541015625, -0.058200836181640625, -0.054473876953125, -0.050746917724609375, -0.04701995849609375, -0.043292999267578125, -0.0395660400390625, -0.035839080810546875, -0.03211212158203125, -0.028385162353515625, -0.024658203125, -0.020931243896484375, -0.01720428466796875, -0.013477325439453125, -0.0097503662109375, -0.006023406982421875, -0.00229644775390625, 0.001430511474609375, 0.005157470703125, 0.008884429931640625, 0.01261138916015625, 0.016338348388671875, 0.0200653076171875, 0.023792266845703125, 0.02751922607421875, 0.031246185302734375, 0.03497314453125, 0.038700103759765625, 0.04242706298828125, 0.046154022216796875, 0.0498809814453125, 0.053607940673828125, 0.05733489990234375, 0.061061859130859375, 0.064788818359375, 0.06851577758789062, 0.07224273681640625, 0.07596969604492188, 0.0796966552734375, 0.08342361450195312, 0.08715057373046875, 0.09087753295898438, 0.0946044921875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 12.0, 38.0, 95.0, 283.0, 380.0, 115.0, 43.0, 22.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.025970458984375, -0.02533864974975586, -0.02470684051513672, -0.024075031280517578, -0.023443222045898438, -0.022811412811279297, -0.022179603576660156, -0.021547794342041016, -0.020915985107421875, -0.020284175872802734, -0.019652366638183594, -0.019020557403564453, -0.018388748168945312, -0.017756938934326172, -0.01712512969970703, -0.01649332046508789, -0.01586151123046875, -0.01522970199584961, -0.014597892761230469, -0.013966083526611328, -0.013334274291992188, -0.012702465057373047, -0.012070655822753906, -0.011438846588134766, -0.010807037353515625, -0.010175228118896484, -0.009543418884277344, -0.008911609649658203, -0.008279800415039062, -0.007647991180419922, -0.007016181945800781, -0.006384372711181641, -0.0057525634765625, -0.005120754241943359, -0.004488945007324219, -0.003857135772705078, -0.0032253265380859375, -0.002593517303466797, -0.0019617080688476562, -0.0013298988342285156, -0.000698089599609375, -6.628036499023438e-05, 0.0005655288696289062, 0.0011973381042480469, 0.0018291473388671875, 0.002460956573486328, 0.0030927658081054688, 0.0037245750427246094, 0.00435638427734375, 0.004988193511962891, 0.005620002746582031, 0.006251811981201172, 0.0068836212158203125, 0.007515430450439453, 0.008147239685058594, 0.008779048919677734, 0.009410858154296875, 0.010042667388916016, 0.010674476623535156, 0.011306285858154297, 0.011938095092773438, 0.012569904327392578, 0.013201713562011719, 0.01383352279663086, 0.01446533203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 8.0, 7.0, 14.0, 14.0, 24.0, 24.0, 30.0, 43.0, 57.0, 75.0, 121.0, 239.0, 537.0, 1358.0, 5560.0, 35038.0, 3039622.0, 1073110.0, 30220.0, 5585.0, 1482.0, 525.0, 228.0, 124.0, 81.0, 45.0, 26.0, 23.0, 12.0, 9.0, 5.0, 4.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0394287109375, -0.038390159606933594, -0.03735160827636719, -0.03631305694580078, -0.035274505615234375, -0.03423595428466797, -0.03319740295410156, -0.032158851623535156, -0.03112030029296875, -0.030081748962402344, -0.029043197631835938, -0.02800464630126953, -0.026966094970703125, -0.02592754364013672, -0.024888992309570312, -0.023850440979003906, -0.0228118896484375, -0.021773338317871094, -0.020734786987304688, -0.01969623565673828, -0.018657684326171875, -0.01761913299560547, -0.016580581665039062, -0.015542030334472656, -0.01450347900390625, -0.013464927673339844, -0.012426376342773438, -0.011387825012207031, -0.010349273681640625, -0.009310722351074219, -0.008272171020507812, -0.007233619689941406, -0.006195068359375, -0.005156517028808594, -0.0041179656982421875, -0.0030794143676757812, -0.002040863037109375, -0.0010023117065429688, 3.62396240234375e-05, 0.0010747909545898438, 0.00211334228515625, 0.0031518936157226562, 0.0041904449462890625, 0.005228996276855469, 0.006267547607421875, 0.007306098937988281, 0.008344650268554688, 0.009383201599121094, 0.0104217529296875, 0.011460304260253906, 0.012498855590820312, 0.013537406921386719, 0.014575958251953125, 0.015614509582519531, 0.016653060913085938, 0.017691612243652344, 0.01873016357421875, 0.019768714904785156, 0.020807266235351562, 0.02184581756591797, 0.022884368896484375, 0.02392292022705078, 0.024961471557617188, 0.026000022888183594, 0.02703857421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 3.0, 9.0, 16.0, 19.0, 17.0, 17.0, 28.0, 25.0, 34.0, 45.0, 46.0, 72.0, 86.0, 116.0, 228.0, 743.0, 1537.0, 417.0, 192.0, 131.0, 87.0, 63.0, 36.0, 26.0, 13.0, 12.0, 11.0, 6.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01275634765625, -0.012423992156982422, -0.012091636657714844, -0.011759281158447266, -0.011426925659179688, -0.01109457015991211, -0.010762214660644531, -0.010429859161376953, -0.010097503662109375, -0.009765148162841797, -0.009432792663574219, -0.00910043716430664, -0.008768081665039062, -0.008435726165771484, -0.008103370666503906, -0.007771015167236328, -0.00743865966796875, -0.007106304168701172, -0.006773948669433594, -0.006441593170166016, -0.0061092376708984375, -0.005776882171630859, -0.005444526672363281, -0.005112171173095703, -0.004779815673828125, -0.004447460174560547, -0.004115104675292969, -0.0037827491760253906, -0.0034503936767578125, -0.0031180381774902344, -0.0027856826782226562, -0.002453327178955078, -0.0021209716796875, -0.0017886161804199219, -0.0014562606811523438, -0.0011239051818847656, -0.0007915496826171875, -0.0004591941833496094, -0.00012683868408203125, 0.00020551681518554688, 0.000537872314453125, 0.0008702278137207031, 0.0012025833129882812, 0.0015349388122558594, 0.0018672943115234375, 0.0021996498107910156, 0.0025320053100585938, 0.002864360809326172, 0.00319671630859375, 0.003529071807861328, 0.0038614273071289062, 0.004193782806396484, 0.0045261383056640625, 0.004858493804931641, 0.005190849304199219, 0.005523204803466797, 0.005855560302734375, 0.006187915802001953, 0.006520271301269531, 0.006852626800537109, 0.0071849822998046875, 0.007517337799072266, 0.007849693298339844, 0.008182048797607422, 0.008514404296875]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 44.0, 966.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.49735212326049805, -0.4687346816062927, -0.4401172399520874, -0.4114997684955597, -0.38288232684135437, -0.35426488518714905, -0.32564741373062134, -0.297029972076416, -0.2684125304222107, -0.23979508876800537, -0.21117763221263885, -0.18256017565727234, -0.15394273400306702, -0.1253252923488617, -0.09670783579349518, -0.06809037923812866, -0.03947293758392334, -0.01085548847913742, 0.0177619606256485, 0.04637940973043442, 0.07499685883522034, 0.10361430048942566, 0.13223175704479218, 0.1608492136001587, 0.189466655254364, 0.21808409690856934, 0.24670155346393585, 0.27531901001930237, 0.3039364516735077, 0.332553893327713, 0.3611713647842407, 0.38978880643844604, 0.41840624809265137, 0.4470236897468567, 0.475641131401062, 0.5042585730552673, 0.5328760147094727, 0.5614935159683228, 0.5901109576225281, 0.6187283992767334, 0.6473458409309387, 0.675963282585144, 0.7045807242393494, 0.7331981658935547, 0.7618156671524048, 0.7904330492019653, 0.8190505504608154, 0.8476679921150208, 0.8762854337692261, 0.9049028754234314, 0.9335203170776367, 0.962137758731842, 0.9907552003860474, 1.0193727016448975, 1.047990083694458, 1.076607584953308, 1.1052250862121582, 1.1338425874710083, 1.1624599695205688, 1.191077470779419, 1.2196948528289795, 1.2483123540878296, 1.2769297361373901, 1.3055472373962402, 1.3341646194458008]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 17.0, 20.0, 26.0, 37.0, 38.0, 31.0, 39.0, 61.0, 73.0, 84.0, 66.0, 85.0, 70.0, 54.0, 65.0, 57.0, 47.0, 32.0, 30.0, 20.0, 13.0, 8.0, 7.0, 6.0, 1.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0845295786857605, -0.08220262825489044, -0.07987567037343979, -0.07754871249198914, -0.07522176206111908, -0.07289481163024902, -0.07056785374879837, -0.06824089586734772, -0.06591394543647766, -0.0635869950056076, -0.06126003712415695, -0.0589330829679966, -0.05660612881183624, -0.05427917465567589, -0.05195222049951553, -0.04962526634335518, -0.047298312187194824, -0.04497135803103447, -0.042644403874874115, -0.04031744971871376, -0.037990495562553406, -0.03566354140639305, -0.0333365872502327, -0.031009633094072342, -0.028682678937911987, -0.026355724781751633, -0.024028770625591278, -0.021701816469430923, -0.01937486231327057, -0.017047908157110214, -0.01472095400094986, -0.012393999844789505, -0.01006704568862915, -0.007740091532468796, -0.005413137376308441, -0.0030861832201480865, -0.0007592290639877319, 0.0015677250921726227, 0.0038946792483329773, 0.006221633404493332, 0.008548587560653687, 0.010875541716814041, 0.013202495872974396, 0.01552945002913475, 0.017856404185295105, 0.02018335834145546, 0.022510312497615814, 0.02483726665377617, 0.027164220809936523, 0.029491174966096878, 0.03181812912225723, 0.03414508327841759, 0.03647203743457794, 0.038798991590738297, 0.04112594574689865, 0.043452899903059006, 0.04577985405921936, 0.048106808215379715, 0.05043376237154007, 0.052760716527700424, 0.05508767068386078, 0.05741462484002113, 0.05974157899618149, 0.06206853315234184, 0.0643954873085022]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 8.0, 11.0, 10.0, 11.0, 16.0, 18.0, 22.0, 28.0, 38.0, 59.0, 76.0, 134.0, 146.0, 167.0, 285.0, 420.0, 688.0, 1820.0, 9245.0, 168068.0, 834847.0, 26450.0, 3288.0, 988.0, 504.0, 326.0, 217.0, 188.0, 96.0, 97.0, 67.0, 64.0, 32.0, 25.0, 18.0, 15.0, 10.0, 16.0, 5.0, 10.0, 4.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.056121826171875, -0.054379940032958984, -0.05263805389404297, -0.05089616775512695, -0.04915428161621094, -0.04741239547729492, -0.045670509338378906, -0.04392862319946289, -0.042186737060546875, -0.04044485092163086, -0.038702964782714844, -0.03696107864379883, -0.03521919250488281, -0.0334773063659668, -0.03173542022705078, -0.029993534088134766, -0.02825164794921875, -0.026509761810302734, -0.02476787567138672, -0.023025989532470703, -0.021284103393554688, -0.019542217254638672, -0.017800331115722656, -0.01605844497680664, -0.014316558837890625, -0.01257467269897461, -0.010832786560058594, -0.009090900421142578, -0.0073490142822265625, -0.005607128143310547, -0.0038652420043945312, -0.0021233558654785156, -0.0003814697265625, 0.0013604164123535156, 0.0031023025512695312, 0.004844188690185547, 0.0065860748291015625, 0.008327960968017578, 0.010069847106933594, 0.01181173324584961, 0.013553619384765625, 0.01529550552368164, 0.017037391662597656, 0.018779277801513672, 0.020521163940429688, 0.022263050079345703, 0.02400493621826172, 0.025746822357177734, 0.02748870849609375, 0.029230594635009766, 0.03097248077392578, 0.0327143669128418, 0.03445625305175781, 0.03619813919067383, 0.037940025329589844, 0.03968191146850586, 0.041423797607421875, 0.04316568374633789, 0.044907569885253906, 0.04664945602416992, 0.04839134216308594, 0.05013322830200195, 0.05187511444091797, 0.053617000579833984, 0.05535888671875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 16.0, 44.0, 120.0, 337.0, 322.0, 101.0, 32.0, 15.0, 9.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.02691650390625, -0.02627408504486084, -0.02563166618347168, -0.02498924732208252, -0.02434682846069336, -0.0237044095993042, -0.02306199073791504, -0.02241957187652588, -0.02177715301513672, -0.02113473415374756, -0.0204923152923584, -0.01984989643096924, -0.019207477569580078, -0.018565058708190918, -0.017922639846801758, -0.017280220985412598, -0.016637802124023438, -0.015995383262634277, -0.015352964401245117, -0.014710545539855957, -0.014068126678466797, -0.013425707817077637, -0.012783288955688477, -0.012140870094299316, -0.011498451232910156, -0.010856032371520996, -0.010213613510131836, -0.009571194648742676, -0.008928775787353516, -0.008286356925964355, -0.007643938064575195, -0.007001519203186035, -0.006359100341796875, -0.005716681480407715, -0.005074262619018555, -0.0044318437576293945, -0.0037894248962402344, -0.0031470060348510742, -0.002504587173461914, -0.001862168312072754, -0.0012197494506835938, -0.0005773305892944336, 6.508827209472656e-05, 0.0007075071334838867, 0.0013499259948730469, 0.001992344856262207, 0.002634763717651367, 0.0032771825790405273, 0.0039196014404296875, 0.004562020301818848, 0.005204439163208008, 0.005846858024597168, 0.006489276885986328, 0.007131695747375488, 0.0077741146087646484, 0.008416533470153809, 0.009058952331542969, 0.009701371192932129, 0.010343790054321289, 0.01098620891571045, 0.01162862777709961, 0.01227104663848877, 0.01291346549987793, 0.01355588436126709, 0.01419830322265625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 5.0, 15.0, 6.0, 11.0, 17.0, 16.0, 15.0, 24.0, 39.0, 29.0, 34.0, 60.0, 57.0, 73.0, 139.0, 224.0, 578.0, 3418.0, 227134.0, 805762.0, 9212.0, 783.0, 271.0, 149.0, 89.0, 66.0, 59.0, 49.0, 45.0, 23.0, 24.0, 20.0, 20.0, 22.0, 14.0, 10.0, 6.0, 7.0, 9.0, 4.0, 3.0, 1.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0809326171875, -0.07856273651123047, -0.07619285583496094, -0.0738229751586914, -0.07145309448242188, -0.06908321380615234, -0.06671333312988281, -0.06434345245361328, -0.06197357177734375, -0.05960369110107422, -0.05723381042480469, -0.054863929748535156, -0.052494049072265625, -0.050124168395996094, -0.04775428771972656, -0.04538440704345703, -0.0430145263671875, -0.04064464569091797, -0.03827476501464844, -0.035904884338378906, -0.033535003662109375, -0.031165122985839844, -0.028795242309570312, -0.02642536163330078, -0.02405548095703125, -0.02168560028076172, -0.019315719604492188, -0.016945838928222656, -0.014575958251953125, -0.012206077575683594, -0.009836196899414062, -0.007466316223144531, -0.005096435546875, -0.0027265548706054688, -0.0003566741943359375, 0.0020132064819335938, 0.004383087158203125, 0.006752967834472656, 0.009122848510742188, 0.011492729187011719, 0.01386260986328125, 0.01623249053955078, 0.018602371215820312, 0.020972251892089844, 0.023342132568359375, 0.025712013244628906, 0.028081893920898438, 0.03045177459716797, 0.0328216552734375, 0.03519153594970703, 0.03756141662597656, 0.039931297302246094, 0.042301177978515625, 0.044671058654785156, 0.04704093933105469, 0.04941082000732422, 0.05178070068359375, 0.05415058135986328, 0.05652046203613281, 0.058890342712402344, 0.061260223388671875, 0.0636301040649414, 0.06599998474121094, 0.06836986541748047, 0.07073974609375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 1.0, 8.0, 12.0, 8.0, 10.0, 15.0, 17.0, 11.0, 21.0, 21.0, 23.0, 21.0, 36.0, 27.0, 35.0, 42.0, 50.0, 51.0, 44.0, 43.0, 43.0, 52.0, 46.0, 39.0, 33.0, 33.0, 21.0, 36.0, 35.0, 32.0, 13.0, 16.0, 20.0, 16.0, 10.0, 14.0, 8.0, 8.0, 5.0, 8.0, 3.0, 2.0, 4.0, 4.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-0.0129547119140625, -0.012572050094604492, -0.012189388275146484, -0.011806726455688477, -0.011424064636230469, -0.011041402816772461, -0.010658740997314453, -0.010276079177856445, -0.009893417358398438, -0.00951075553894043, -0.009128093719482422, -0.008745431900024414, -0.008362770080566406, -0.007980108261108398, -0.007597446441650391, -0.007214784622192383, -0.006832122802734375, -0.006449460983276367, -0.006066799163818359, -0.0056841373443603516, -0.005301475524902344, -0.004918813705444336, -0.004536151885986328, -0.00415349006652832, -0.0037708282470703125, -0.0033881664276123047, -0.003005504608154297, -0.002622842788696289, -0.0022401809692382812, -0.0018575191497802734, -0.0014748573303222656, -0.0010921955108642578, -0.00070953369140625, -0.0003268718719482422, 5.5789947509765625e-05, 0.00043845176696777344, 0.0008211135864257812, 0.001203775405883789, 0.0015864372253417969, 0.0019690990447998047, 0.0023517608642578125, 0.0027344226837158203, 0.003117084503173828, 0.003499746322631836, 0.0038824081420898438, 0.0042650699615478516, 0.004647731781005859, 0.005030393600463867, 0.005413055419921875, 0.005795717239379883, 0.006178379058837891, 0.0065610408782958984, 0.006943702697753906, 0.007326364517211914, 0.007709026336669922, 0.00809168815612793, 0.008474349975585938, 0.008857011795043945, 0.009239673614501953, 0.009622335433959961, 0.010004997253417969, 0.010387659072875977, 0.010770320892333984, 0.011152982711791992, 0.01153564453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 6.0, 5.0, 10.0, 18.0, 28.0, 43.0, 84.0, 184.0, 536.0, 1639.0, 6723.0, 83538.0, 930637.0, 20147.0, 3406.0, 930.0, 332.0, 136.0, 59.0, 41.0, 20.0, 18.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01300048828125, -0.01246500015258789, -0.011929512023925781, -0.011394023895263672, -0.010858535766601562, -0.010323047637939453, -0.009787559509277344, -0.009252071380615234, -0.008716583251953125, -0.008181095123291016, -0.007645606994628906, -0.007110118865966797, -0.0065746307373046875, -0.006039142608642578, -0.005503654479980469, -0.004968166351318359, -0.00443267822265625, -0.0038971900939941406, -0.0033617019653320312, -0.002826213836669922, -0.0022907257080078125, -0.0017552375793457031, -0.0012197494506835938, -0.0006842613220214844, -0.000148773193359375, 0.0003867149353027344, 0.0009222030639648438, 0.0014576911926269531, 0.0019931793212890625, 0.002528667449951172, 0.0030641555786132812, 0.0035996437072753906, 0.0041351318359375, 0.004670619964599609, 0.005206108093261719, 0.005741596221923828, 0.0062770843505859375, 0.006812572479248047, 0.007348060607910156, 0.007883548736572266, 0.008419036865234375, 0.008954524993896484, 0.009490013122558594, 0.010025501251220703, 0.010560989379882812, 0.011096477508544922, 0.011631965637207031, 0.01216745376586914, 0.01270294189453125, 0.01323843002319336, 0.013773918151855469, 0.014309406280517578, 0.014844894409179688, 0.015380382537841797, 0.015915870666503906, 0.016451358795166016, 0.016986846923828125, 0.017522335052490234, 0.018057823181152344, 0.018593311309814453, 0.019128799438476562, 0.019664287567138672, 0.02019977569580078, 0.02073526382446289, 0.021270751953125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 10.0, 18.0, 36.0, 87.0, 269.0, 342.0, 115.0, 38.0, 28.0, 10.0, 5.0, 2.0, 7.0, 2.0, 7.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003323554992675781, -0.00032166019082069397, -0.0003109648823738098, -0.00030026957392692566, -0.0002895742654800415, -0.00027887895703315735, -0.0002681836485862732, -0.00025748834013938904, -0.0002467930316925049, -0.00023609772324562073, -0.00022540241479873657, -0.00021470710635185242, -0.00020401179790496826, -0.0001933164894580841, -0.00018262118101119995, -0.0001719258725643158, -0.00016123056411743164, -0.00015053525567054749, -0.00013983994722366333, -0.00012914463877677917, -0.00011844933032989502, -0.00010775402188301086, -9.705871343612671e-05, -8.636340498924255e-05, -7.56680965423584e-05, -6.497278809547424e-05, -5.427747964859009e-05, -4.358217120170593e-05, -3.288686275482178e-05, -2.2191554307937622e-05, -1.1496245861053467e-05, -8.009374141693115e-07, 9.894371032714844e-06, 2.0589679479599e-05, 3.1284987926483154e-05, 4.198029637336731e-05, 5.2675604820251465e-05, 6.337091326713562e-05, 7.406622171401978e-05, 8.476153016090393e-05, 9.545683860778809e-05, 0.00010615214705467224, 0.0001168474555015564, 0.00012754276394844055, 0.0001382380723953247, 0.00014893338084220886, 0.00015962868928909302, 0.00017032399773597717, 0.00018101930618286133, 0.00019171461462974548, 0.00020240992307662964, 0.0002131052315235138, 0.00022380053997039795, 0.0002344958484172821, 0.00024519115686416626, 0.0002558864653110504, 0.00026658177375793457, 0.0002772770822048187, 0.0002879723906517029, 0.00029866769909858704, 0.0003093630075454712, 0.00032005831599235535, 0.0003307536244392395, 0.00034144893288612366, 0.0003521442413330078]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 7.0, 9.0, 11.0, 11.0, 7.0, 8.0, 13.0, 24.0, 28.0, 54.0, 93.0, 202.0, 1225.0, 151545.0, 892661.0, 2091.0, 278.0, 107.0, 50.0, 29.0, 25.0, 12.0, 8.0, 8.0, 13.0, 7.0, 3.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0157012939453125, -0.01522684097290039, -0.014752388000488281, -0.014277935028076172, -0.013803482055664062, -0.013329029083251953, -0.012854576110839844, -0.012380123138427734, -0.011905670166015625, -0.011431217193603516, -0.010956764221191406, -0.010482311248779297, -0.010007858276367188, -0.009533405303955078, -0.009058952331542969, -0.00858449935913086, -0.00811004638671875, -0.007635593414306641, -0.007161140441894531, -0.006686687469482422, -0.0062122344970703125, -0.005737781524658203, -0.005263328552246094, -0.004788875579833984, -0.004314422607421875, -0.0038399696350097656, -0.0033655166625976562, -0.002891063690185547, -0.0024166107177734375, -0.0019421577453613281, -0.0014677047729492188, -0.0009932518005371094, -0.000518798828125, -4.4345855712890625e-05, 0.00043010711669921875, 0.0009045600891113281, 0.0013790130615234375, 0.0018534660339355469, 0.0023279190063476562, 0.0028023719787597656, 0.003276824951171875, 0.0037512779235839844, 0.004225730895996094, 0.004700183868408203, 0.0051746368408203125, 0.005649089813232422, 0.006123542785644531, 0.006597995758056641, 0.00707244873046875, 0.007546901702880859, 0.008021354675292969, 0.008495807647705078, 0.008970260620117188, 0.009444713592529297, 0.009919166564941406, 0.010393619537353516, 0.010868072509765625, 0.011342525482177734, 0.011816978454589844, 0.012291431427001953, 0.012765884399414062, 0.013240337371826172, 0.013714790344238281, 0.01418924331665039, 0.0146636962890625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 4.0, 3.0, 9.0, 7.0, 9.0, 14.0, 5.0, 8.0, 9.0, 13.0, 26.0, 27.0, 48.0, 68.0, 99.0, 124.0, 121.0, 112.0, 78.0, 60.0, 47.0, 25.0, 23.0, 9.0, 6.0, 9.0, 12.0, 6.0, 6.0, 5.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0024127960205078125, -0.002338320016860962, -0.0022638440132141113, -0.0021893680095672607, -0.00211489200592041, -0.0020404160022735596, -0.001965939998626709, -0.0018914639949798584, -0.0018169879913330078, -0.0017425119876861572, -0.0016680359840393066, -0.001593559980392456, -0.0015190839767456055, -0.0014446079730987549, -0.0013701319694519043, -0.0012956559658050537, -0.0012211799621582031, -0.0011467039585113525, -0.001072227954864502, -0.0009977519512176514, -0.0009232759475708008, -0.0008487999439239502, -0.0007743239402770996, -0.000699847936630249, -0.0006253719329833984, -0.0005508959293365479, -0.00047641992568969727, -0.0004019439220428467, -0.0003274679183959961, -0.0002529919147491455, -0.00017851591110229492, -0.00010403990745544434, -2.956390380859375e-05, 4.4912099838256836e-05, 0.00011938810348510742, 0.000193864107131958, 0.0002683401107788086, 0.0003428161144256592, 0.00041729211807250977, 0.0004917681217193604, 0.0005662441253662109, 0.0006407201290130615, 0.0007151961326599121, 0.0007896721363067627, 0.0008641481399536133, 0.0009386241436004639, 0.0010131001472473145, 0.001087576150894165, 0.0011620521545410156, 0.0012365281581878662, 0.0013110041618347168, 0.0013854801654815674, 0.001459956169128418, 0.0015344321727752686, 0.0016089081764221191, 0.0016833841800689697, 0.0017578601837158203, 0.001832336187362671, 0.0019068121910095215, 0.001981288194656372, 0.0020557641983032227, 0.0021302402019500732, 0.002204716205596924, 0.0022791922092437744, 0.002353668212890625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 35.0, 358.0, 494.0, 92.0, 20.0, 5.0, 4.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4038991332054138, -0.39511099457740784, -0.38632285594940186, -0.3775346875190735, -0.3687465488910675, -0.3599584102630615, -0.35117027163505554, -0.34238213300704956, -0.3335939943790436, -0.3248058557510376, -0.3160177171230316, -0.30722957849502563, -0.29844141006469727, -0.2896532714366913, -0.2808651328086853, -0.2720769941806793, -0.26328885555267334, -0.25450071692466736, -0.24571256339550018, -0.2369244247674942, -0.22813628613948822, -0.21934813261032104, -0.21055999398231506, -0.20177185535430908, -0.1929836869239807, -0.18419554829597473, -0.17540739476680756, -0.16661925613880157, -0.1578311175107956, -0.14904296398162842, -0.14025482535362244, -0.13146668672561646, -0.12267856299877167, -0.11389041692018509, -0.10510227829217911, -0.09631413221359253, -0.08752599358558655, -0.07873784750699997, -0.06994970142841339, -0.06116155907511711, -0.05237341672182083, -0.04358527436852455, -0.03479713201522827, -0.026008985936641693, -0.017220843583345413, -0.008432701230049133, 0.00035544484853744507, 0.009143587201833725, 0.017931729555130005, 0.026719871908426285, 0.035508014261722565, 0.04429616034030914, 0.05308430269360542, 0.0618724450469017, 0.07066059112548828, 0.07944872975349426, 0.08823687583208084, 0.09702502191066742, 0.1058131605386734, 0.11460130661725998, 0.12338945269584656, 0.13217759132385254, 0.14096572995185852, 0.1497538834810257, 0.15854202210903168]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 10.0, 11.0, 20.0, 35.0, 54.0, 71.0, 72.0, 87.0, 82.0, 95.0, 108.0, 89.0, 96.0, 63.0, 34.0, 27.0, 22.0, 8.0, 5.0, 8.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09727424383163452, -0.09344995021820068, -0.08962565660476685, -0.0858013704419136, -0.08197707682847977, -0.07815278321504593, -0.07432849705219269, -0.07050420343875885, -0.06667990982532501, -0.06285561621189117, -0.059031326323747635, -0.055207036435604095, -0.05138274282217026, -0.04755844920873642, -0.04373415932059288, -0.03990986943244934, -0.0360855758190155, -0.032261282205581665, -0.028436992317438126, -0.024612700566649437, -0.02078840881586075, -0.01696411706507206, -0.013139825314283371, -0.009315533563494682, -0.005491241812705994, -0.001666950061917305, 0.0021573416888713837, 0.005981633439660072, 0.009805925190448761, 0.01363021694123745, 0.01745450869202614, 0.021278800442814827, 0.025103092193603516, 0.028927383944392204, 0.03275167569518089, 0.03657596558332443, 0.04040025919675827, 0.04422455281019211, 0.04804884269833565, 0.05187313258647919, 0.055697426199913025, 0.05952171981334686, 0.0633460134267807, 0.06717029958963394, 0.07099459320306778, 0.07481888681650162, 0.07864317297935486, 0.0824674665927887, 0.08629176020622253, 0.09011605381965637, 0.09394034743309021, 0.09776463359594345, 0.10158892720937729, 0.10541322082281113, 0.10923750698566437, 0.1130618005990982, 0.11688609421253204, 0.12071038782596588, 0.12453468143939972, 0.12835897505283356, 0.1321832537651062, 0.13600754737854004, 0.13983184099197388, 0.14365613460540771, 0.14748042821884155]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 7.0, 5.0, 7.0, 12.0, 23.0, 38.0, 59.0, 113.0, 391.0, 1680.0, 397498.0, 3791634.0, 2283.0, 307.0, 114.0, 52.0, 25.0, 9.0, 9.0, 9.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1334228515625, -0.13009071350097656, -0.12675857543945312, -0.12342643737792969, -0.12009429931640625, -0.11676216125488281, -0.11343002319335938, -0.11009788513183594, -0.1067657470703125, -0.10343360900878906, -0.10010147094726562, -0.09676933288574219, -0.09343719482421875, -0.09010505676269531, -0.08677291870117188, -0.08344078063964844, -0.080108642578125, -0.07677650451660156, -0.07344436645507812, -0.07011222839355469, -0.06678009033203125, -0.06344795227050781, -0.060115814208984375, -0.05678367614746094, -0.0534515380859375, -0.05011940002441406, -0.046787261962890625, -0.04345512390136719, -0.04012298583984375, -0.03679084777832031, -0.033458709716796875, -0.030126571655273438, -0.02679443359375, -0.023462295532226562, -0.020130157470703125, -0.016798019409179688, -0.01346588134765625, -0.010133743286132812, -0.006801605224609375, -0.0034694671630859375, -0.0001373291015625, 0.0031948089599609375, 0.006526947021484375, 0.009859085083007812, 0.01319122314453125, 0.016523361206054688, 0.019855499267578125, 0.023187637329101562, 0.026519775390625, 0.029851913452148438, 0.033184051513671875, 0.03651618957519531, 0.03984832763671875, 0.04318046569824219, 0.046512603759765625, 0.04984474182128906, 0.0531768798828125, 0.05650901794433594, 0.059841156005859375, 0.06317329406738281, 0.06650543212890625, 0.06983757019042969, 0.07316970825195312, 0.07650184631347656, 0.079833984375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 10.0, 11.0, 36.0, 86.0, 284.0, 367.0, 145.0, 38.0, 22.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0257110595703125, -0.025101065635681152, -0.024491071701049805, -0.023881077766418457, -0.02327108383178711, -0.02266108989715576, -0.022051095962524414, -0.021441102027893066, -0.02083110809326172, -0.02022111415863037, -0.019611120223999023, -0.019001126289367676, -0.018391132354736328, -0.01778113842010498, -0.017171144485473633, -0.016561150550842285, -0.015951156616210938, -0.01534116268157959, -0.014731168746948242, -0.014121174812316895, -0.013511180877685547, -0.0129011869430542, -0.012291193008422852, -0.011681199073791504, -0.011071205139160156, -0.010461211204528809, -0.009851217269897461, -0.009241223335266113, -0.008631229400634766, -0.008021235466003418, -0.00741124153137207, -0.006801247596740723, -0.006191253662109375, -0.005581259727478027, -0.00497126579284668, -0.004361271858215332, -0.0037512779235839844, -0.0031412839889526367, -0.002531290054321289, -0.0019212961196899414, -0.0013113021850585938, -0.0007013082504272461, -9.131431579589844e-05, 0.0005186796188354492, 0.0011286735534667969, 0.0017386674880981445, 0.002348661422729492, 0.00295865535736084, 0.0035686492919921875, 0.004178643226623535, 0.004788637161254883, 0.0053986310958862305, 0.006008625030517578, 0.006618618965148926, 0.0072286128997802734, 0.007838606834411621, 0.008448600769042969, 0.009058594703674316, 0.009668588638305664, 0.010278582572937012, 0.01088857650756836, 0.011498570442199707, 0.012108564376831055, 0.012718558311462402, 0.01332855224609375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 8.0, 5.0, 10.0, 19.0, 23.0, 36.0, 37.0, 66.0, 96.0, 139.0, 245.0, 429.0, 983.0, 2784.0, 11978.0, 155310.0, 3878630.0, 127620.0, 11176.0, 2638.0, 1010.0, 452.0, 210.0, 123.0, 63.0, 43.0, 40.0, 30.0, 15.0, 13.0, 12.0, 12.0, 5.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.032440185546875, -0.03149914741516113, -0.030558109283447266, -0.0296170711517334, -0.02867603302001953, -0.027734994888305664, -0.026793956756591797, -0.02585291862487793, -0.024911880493164062, -0.023970842361450195, -0.023029804229736328, -0.02208876609802246, -0.021147727966308594, -0.020206689834594727, -0.01926565170288086, -0.018324613571166992, -0.017383575439453125, -0.016442537307739258, -0.01550149917602539, -0.014560461044311523, -0.013619422912597656, -0.012678384780883789, -0.011737346649169922, -0.010796308517456055, -0.009855270385742188, -0.00891423225402832, -0.007973194122314453, -0.007032155990600586, -0.006091117858886719, -0.0051500797271728516, -0.004209041595458984, -0.003268003463745117, -0.00232696533203125, -0.0013859272003173828, -0.0004448890686035156, 0.0004961490631103516, 0.0014371871948242188, 0.002378225326538086, 0.003319263458251953, 0.00426030158996582, 0.0052013397216796875, 0.006142377853393555, 0.007083415985107422, 0.008024454116821289, 0.008965492248535156, 0.009906530380249023, 0.01084756851196289, 0.011788606643676758, 0.012729644775390625, 0.013670682907104492, 0.01461172103881836, 0.015552759170532227, 0.016493797302246094, 0.01743483543395996, 0.018375873565673828, 0.019316911697387695, 0.020257949829101562, 0.02119898796081543, 0.022140026092529297, 0.023081064224243164, 0.02402210235595703, 0.0249631404876709, 0.025904178619384766, 0.026845216751098633, 0.0277862548828125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 8.0, 7.0, 8.0, 6.0, 7.0, 11.0, 24.0, 25.0, 37.0, 40.0, 66.0, 109.0, 119.0, 159.0, 260.0, 437.0, 763.0, 724.0, 384.0, 261.0, 198.0, 132.0, 89.0, 64.0, 34.0, 27.0, 23.0, 13.0, 12.0, 9.0, 6.0, 4.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.01125335693359375, -0.010931015014648438, -0.010608673095703125, -0.010286331176757812, -0.0099639892578125, -0.009641647338867188, -0.009319305419921875, -0.008996963500976562, -0.00867462158203125, -0.008352279663085938, -0.008029937744140625, -0.0077075958251953125, -0.00738525390625, -0.0070629119873046875, -0.006740570068359375, -0.0064182281494140625, -0.00609588623046875, -0.0057735443115234375, -0.005451202392578125, -0.0051288604736328125, -0.0048065185546875, -0.0044841766357421875, -0.004161834716796875, -0.0038394927978515625, -0.00351715087890625, -0.0031948089599609375, -0.002872467041015625, -0.0025501251220703125, -0.002227783203125, -0.0019054412841796875, -0.001583099365234375, -0.0012607574462890625, -0.00093841552734375, -0.0006160736083984375, -0.000293731689453125, 2.86102294921875e-05, 0.0003509521484375, 0.0006732940673828125, 0.000995635986328125, 0.0013179779052734375, 0.00164031982421875, 0.0019626617431640625, 0.002285003662109375, 0.0026073455810546875, 0.0029296875, 0.0032520294189453125, 0.003574371337890625, 0.0038967132568359375, 0.00421905517578125, 0.0045413970947265625, 0.004863739013671875, 0.0051860809326171875, 0.0055084228515625, 0.0058307647705078125, 0.006153106689453125, 0.0064754486083984375, 0.00679779052734375, 0.0071201324462890625, 0.007442474365234375, 0.0077648162841796875, 0.008087158203125, 0.008409500122070312, 0.008731842041015625, 0.009054183959960938, 0.00937652587890625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 6.0, 65.0, 814.0, 123.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20801952481269836, -0.1984012871980667, -0.18878304958343506, -0.1791648119688034, -0.16954657435417175, -0.1599283367395401, -0.15031009912490845, -0.1406918615102768, -0.13107362389564514, -0.12145538628101349, -0.11183714866638184, -0.10221891105175018, -0.09260067343711853, -0.08298243582248688, -0.07336419820785522, -0.06374596059322357, -0.05412772297859192, -0.044509485363960266, -0.03489124774932861, -0.02527301013469696, -0.015654772520065308, -0.006036534905433655, 0.003581702709197998, 0.013199940323829651, 0.022818177938461304, 0.03243641555309296, 0.04205465316772461, 0.05167289078235626, 0.061291128396987915, 0.07090936601161957, 0.08052760362625122, 0.09014584124088287, 0.09976407885551453, 0.10938231647014618, 0.11900055408477783, 0.12861879169940948, 0.13823702931404114, 0.1478552669286728, 0.15747350454330444, 0.1670917421579361, 0.17670997977256775, 0.1863282173871994, 0.19594645500183105, 0.2055646926164627, 0.21518293023109436, 0.224801167845726, 0.23441940546035767, 0.24403764307498932, 0.25365588068962097, 0.2632741332054138, 0.2728923559188843, 0.28251057863235474, 0.2921288311481476, 0.30174708366394043, 0.3113653063774109, 0.32098352909088135, 0.3306017816066742, 0.34022003412246704, 0.3498382568359375, 0.35945647954940796, 0.3690747320652008, 0.37869298458099365, 0.3883112072944641, 0.39792943000793457, 0.4075476825237274]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 7.0, 9.0, 12.0, 17.0, 15.0, 17.0, 23.0, 23.0, 31.0, 43.0, 44.0, 49.0, 53.0, 58.0, 63.0, 49.0, 58.0, 60.0, 55.0, 56.0, 49.0, 34.0, 38.0, 33.0, 25.0, 21.0, 13.0, 15.0, 13.0, 3.0, 7.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04817080497741699, -0.04672170430421829, -0.045272599905729294, -0.043823495507240295, -0.042374394834041595, -0.040925294160842896, -0.0394761897623539, -0.0380270853638649, -0.0365779846906662, -0.0351288840174675, -0.0336797796189785, -0.0322306752204895, -0.030781574547290802, -0.029332472011446953, -0.027883369475603104, -0.026434266939759254, -0.024985164403915405, -0.023536061868071556, -0.022086959332227707, -0.020637856796383858, -0.01918875426054001, -0.01773965172469616, -0.01629054918885231, -0.014841446653008461, -0.013392344117164612, -0.011943241581320763, -0.010494139045476913, -0.009045036509633064, -0.007595933973789215, -0.006146831437945366, -0.004697728902101517, -0.0032486263662576675, -0.0017995238304138184, -0.0003504212945699692, 0.00109868124127388, 0.002547783777117729, 0.003996886312961578, 0.0054459888488054276, 0.006895091384649277, 0.008344193920493126, 0.009793296456336975, 0.011242398992180824, 0.012691501528024673, 0.014140604063868523, 0.015589706599712372, 0.01703880913555622, 0.01848791167140007, 0.01993701420724392, 0.02138611674308777, 0.022835219278931618, 0.024284321814775467, 0.025733424350619316, 0.027182526886463165, 0.028631629422307014, 0.030080731958150864, 0.03152983635663986, 0.03297893702983856, 0.03442803770303726, 0.03587714210152626, 0.03732624650001526, 0.03877534717321396, 0.04022444784641266, 0.04167355224490166, 0.043122656643390656, 0.044571757316589355]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 10.0, 2.0, 5.0, 11.0, 6.0, 14.0, 26.0, 32.0, 37.0, 64.0, 94.0, 194.0, 307.0, 647.0, 3598.0, 589902.0, 448778.0, 3334.0, 656.0, 316.0, 205.0, 92.0, 69.0, 52.0, 35.0, 15.0, 19.0, 12.0, 6.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11224365234375, -0.1079244613647461, -0.10360527038574219, -0.09928607940673828, -0.09496688842773438, -0.09064769744873047, -0.08632850646972656, -0.08200931549072266, -0.07769012451171875, -0.07337093353271484, -0.06905174255371094, -0.06473255157470703, -0.060413360595703125, -0.05609416961669922, -0.05177497863769531, -0.047455787658691406, -0.0431365966796875, -0.038817405700683594, -0.03449821472167969, -0.03017902374267578, -0.025859832763671875, -0.02154064178466797, -0.017221450805664062, -0.012902259826660156, -0.00858306884765625, -0.004263877868652344, 5.53131103515625e-05, 0.004374504089355469, 0.008693695068359375, 0.013012886047363281, 0.017332077026367188, 0.021651268005371094, 0.025970458984375, 0.030289649963378906, 0.03460884094238281, 0.03892803192138672, 0.043247222900390625, 0.04756641387939453, 0.05188560485839844, 0.056204795837402344, 0.06052398681640625, 0.06484317779541016, 0.06916236877441406, 0.07348155975341797, 0.07780075073242188, 0.08211994171142578, 0.08643913269042969, 0.0907583236694336, 0.0950775146484375, 0.0993967056274414, 0.10371589660644531, 0.10803508758544922, 0.11235427856445312, 0.11667346954345703, 0.12099266052246094, 0.12531185150146484, 0.12963104248046875, 0.13395023345947266, 0.13826942443847656, 0.14258861541748047, 0.14690780639648438, 0.15122699737548828, 0.1555461883544922, 0.1598653793334961, 0.1641845703125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 10.0, 27.0, 71.0, 255.0, 383.0, 180.0, 48.0, 21.0, 10.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0264739990234375, -0.025862693786621094, -0.025251388549804688, -0.02464008331298828, -0.024028778076171875, -0.02341747283935547, -0.022806167602539062, -0.022194862365722656, -0.02158355712890625, -0.020972251892089844, -0.020360946655273438, -0.01974964141845703, -0.019138336181640625, -0.01852703094482422, -0.017915725708007812, -0.017304420471191406, -0.016693115234375, -0.016081809997558594, -0.015470504760742188, -0.014859199523925781, -0.014247894287109375, -0.013636589050292969, -0.013025283813476562, -0.012413978576660156, -0.01180267333984375, -0.011191368103027344, -0.010580062866210938, -0.009968757629394531, -0.009357452392578125, -0.008746147155761719, -0.008134841918945312, -0.007523536682128906, -0.0069122314453125, -0.006300926208496094, -0.0056896209716796875, -0.005078315734863281, -0.004467010498046875, -0.0038557052612304688, -0.0032444000244140625, -0.0026330947875976562, -0.00202178955078125, -0.0014104843139648438, -0.0007991790771484375, -0.00018787384033203125, 0.000423431396484375, 0.0010347366333007812, 0.0016460418701171875, 0.0022573471069335938, 0.00286865234375, 0.0034799575805664062, 0.0040912628173828125, 0.004702568054199219, 0.005313873291015625, 0.005925178527832031, 0.0065364837646484375, 0.007147789001464844, 0.00775909423828125, 0.008370399475097656, 0.008981704711914062, 0.009593009948730469, 0.010204315185546875, 0.010815620422363281, 0.011426925659179688, 0.012038230895996094, 0.0126495361328125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 5.0, 6.0, 5.0, 14.0, 9.0, 22.0, 27.0, 22.0, 35.0, 54.0, 73.0, 110.0, 151.0, 206.0, 343.0, 565.0, 1313.0, 4553.0, 34511.0, 676207.0, 307889.0, 17144.0, 2870.0, 958.0, 448.0, 303.0, 170.0, 142.0, 96.0, 56.0, 59.0, 48.0, 31.0, 17.0, 25.0, 9.0, 10.0, 12.0, 8.0, 5.0, 5.0, 4.0, 1.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04705810546875, -0.04558086395263672, -0.04410362243652344, -0.042626380920410156, -0.041149139404296875, -0.039671897888183594, -0.03819465637207031, -0.03671741485595703, -0.03524017333984375, -0.03376293182373047, -0.03228569030761719, -0.030808448791503906, -0.029331207275390625, -0.027853965759277344, -0.026376724243164062, -0.02489948272705078, -0.0234222412109375, -0.02194499969482422, -0.020467758178710938, -0.018990516662597656, -0.017513275146484375, -0.016036033630371094, -0.014558792114257812, -0.013081550598144531, -0.01160430908203125, -0.010127067565917969, -0.008649826049804688, -0.007172584533691406, -0.005695343017578125, -0.004218101501464844, -0.0027408599853515625, -0.0012636184692382812, 0.000213623046875, 0.0016908645629882812, 0.0031681060791015625, 0.004645347595214844, 0.006122589111328125, 0.007599830627441406, 0.009077072143554688, 0.010554313659667969, 0.01203155517578125, 0.013508796691894531, 0.014986038208007812, 0.016463279724121094, 0.017940521240234375, 0.019417762756347656, 0.020895004272460938, 0.02237224578857422, 0.0238494873046875, 0.02532672882080078, 0.026803970336914062, 0.028281211853027344, 0.029758453369140625, 0.031235694885253906, 0.03271293640136719, 0.03419017791748047, 0.03566741943359375, 0.03714466094970703, 0.03862190246582031, 0.040099143981933594, 0.041576385498046875, 0.043053627014160156, 0.04453086853027344, 0.04600811004638672, 0.0474853515625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 4.0, 6.0, 8.0, 13.0, 6.0, 20.0, 24.0, 18.0, 33.0, 44.0, 40.0, 51.0, 50.0, 74.0, 62.0, 65.0, 64.0, 49.0, 60.0, 60.0, 49.0, 47.0, 29.0, 27.0, 18.0, 16.0, 12.0, 9.0, 7.0, 7.0, 3.0, 8.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01457977294921875, -0.01410520076751709, -0.01363062858581543, -0.01315605640411377, -0.01268148422241211, -0.01220691204071045, -0.011732339859008789, -0.011257767677307129, -0.010783195495605469, -0.010308623313903809, -0.009834051132202148, -0.009359478950500488, -0.008884906768798828, -0.008410334587097168, -0.007935762405395508, -0.007461190223693848, -0.0069866180419921875, -0.006512045860290527, -0.006037473678588867, -0.005562901496887207, -0.005088329315185547, -0.004613757133483887, -0.0041391849517822266, -0.0036646127700805664, -0.0031900405883789062, -0.002715468406677246, -0.002240896224975586, -0.0017663240432739258, -0.0012917518615722656, -0.0008171796798706055, -0.0003426074981689453, 0.00013196468353271484, 0.000606536865234375, 0.0010811090469360352, 0.0015556812286376953, 0.0020302534103393555, 0.0025048255920410156, 0.0029793977737426758, 0.003453969955444336, 0.003928542137145996, 0.004403114318847656, 0.004877686500549316, 0.0053522586822509766, 0.005826830863952637, 0.006301403045654297, 0.006775975227355957, 0.007250547409057617, 0.007725119590759277, 0.008199691772460938, 0.008674263954162598, 0.009148836135864258, 0.009623408317565918, 0.010097980499267578, 0.010572552680969238, 0.011047124862670898, 0.011521697044372559, 0.011996269226074219, 0.012470841407775879, 0.012945413589477539, 0.0134199857711792, 0.01389455795288086, 0.01436913013458252, 0.01484370231628418, 0.01531827449798584, 0.0157928466796875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 4.0, 4.0, 7.0, 7.0, 6.0, 16.0, 32.0, 54.0, 88.0, 186.0, 398.0, 893.0, 2404.0, 10700.0, 941984.0, 84309.0, 4754.0, 1534.0, 597.0, 271.0, 130.0, 63.0, 40.0, 20.0, 15.0, 12.0, 5.0, 2.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05987548828125, -0.05833148956298828, -0.05678749084472656, -0.055243492126464844, -0.053699493408203125, -0.052155494689941406, -0.05061149597167969, -0.04906749725341797, -0.04752349853515625, -0.04597949981689453, -0.04443550109863281, -0.042891502380371094, -0.041347503662109375, -0.039803504943847656, -0.03825950622558594, -0.03671550750732422, -0.0351715087890625, -0.03362751007080078, -0.03208351135253906, -0.030539512634277344, -0.028995513916015625, -0.027451515197753906, -0.025907516479492188, -0.02436351776123047, -0.02281951904296875, -0.02127552032470703, -0.019731521606445312, -0.018187522888183594, -0.016643524169921875, -0.015099525451660156, -0.013555526733398438, -0.012011528015136719, -0.010467529296875, -0.008923530578613281, -0.0073795318603515625, -0.005835533142089844, -0.004291534423828125, -0.0027475357055664062, -0.0012035369873046875, 0.00034046173095703125, 0.00188446044921875, 0.0034284591674804688, 0.0049724578857421875, 0.006516456604003906, 0.008060455322265625, 0.009604454040527344, 0.011148452758789062, 0.012692451477050781, 0.0142364501953125, 0.01578044891357422, 0.017324447631835938, 0.018868446350097656, 0.020412445068359375, 0.021956443786621094, 0.023500442504882812, 0.02504444122314453, 0.02658843994140625, 0.02813243865966797, 0.029676437377929688, 0.031220436096191406, 0.032764434814453125, 0.034308433532714844, 0.03585243225097656, 0.03739643096923828, 0.0389404296875]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 11.0, 10.0, 13.0, 14.0, 12.0, 17.0, 30.0, 34.0, 37.0, 52.0, 73.0, 85.0, 107.0, 114.0, 82.0, 56.0, 66.0, 39.0, 21.0, 28.0, 18.0, 9.0, 7.0, 9.0, 4.0, 7.0, 4.0, 7.0, 5.0, 8.0, 3.0, 4.0, 1.0, 5.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011730194091796875, -0.00011307001113891602, -0.00010883808135986328, -0.00010460615158081055, -0.00010037422180175781, -9.614229202270508e-05, -9.191036224365234e-05, -8.767843246459961e-05, -8.344650268554688e-05, -7.921457290649414e-05, -7.49826431274414e-05, -7.075071334838867e-05, -6.651878356933594e-05, -6.22868537902832e-05, -5.805492401123047e-05, -5.3822994232177734e-05, -4.9591064453125e-05, -4.5359134674072266e-05, -4.112720489501953e-05, -3.68952751159668e-05, -3.266334533691406e-05, -2.8431415557861328e-05, -2.4199485778808594e-05, -1.996755599975586e-05, -1.5735626220703125e-05, -1.150369644165039e-05, -7.271766662597656e-06, -3.039836883544922e-06, 1.1920928955078125e-06, 5.424022674560547e-06, 9.655952453613281e-06, 1.3887882232666016e-05, 1.811981201171875e-05, 2.2351741790771484e-05, 2.658367156982422e-05, 3.081560134887695e-05, 3.504753112792969e-05, 3.927946090698242e-05, 4.3511390686035156e-05, 4.774332046508789e-05, 5.1975250244140625e-05, 5.620718002319336e-05, 6.0439109802246094e-05, 6.467103958129883e-05, 6.890296936035156e-05, 7.31348991394043e-05, 7.736682891845703e-05, 8.159875869750977e-05, 8.58306884765625e-05, 9.006261825561523e-05, 9.429454803466797e-05, 9.85264778137207e-05, 0.00010275840759277344, 0.00010699033737182617, 0.0001112222671508789, 0.00011545419692993164, 0.00011968612670898438, 0.0001239180564880371, 0.00012814998626708984, 0.00013238191604614258, 0.0001366138458251953, 0.00014084577560424805, 0.00014507770538330078, 0.00014930963516235352, 0.00015354156494140625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 2.0, 8.0, 6.0, 11.0, 9.0, 15.0, 11.0, 25.0, 27.0, 34.0, 44.0, 74.0, 96.0, 130.0, 199.0, 376.0, 737.0, 2164.0, 9102.0, 89191.0, 878821.0, 56980.0, 7055.0, 1751.0, 697.0, 318.0, 192.0, 116.0, 96.0, 63.0, 43.0, 36.0, 24.0, 26.0, 16.0, 12.0, 13.0, 8.0, 6.0, 5.0, 5.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01520538330078125, -0.014705538749694824, -0.014205694198608398, -0.013705849647521973, -0.013206005096435547, -0.012706160545349121, -0.012206315994262695, -0.01170647144317627, -0.011206626892089844, -0.010706782341003418, -0.010206937789916992, -0.009707093238830566, -0.00920724868774414, -0.008707404136657715, -0.008207559585571289, -0.007707715034484863, -0.0072078704833984375, -0.006708025932312012, -0.006208181381225586, -0.00570833683013916, -0.005208492279052734, -0.004708647727966309, -0.004208803176879883, -0.003708958625793457, -0.0032091140747070312, -0.0027092695236206055, -0.0022094249725341797, -0.001709580421447754, -0.0012097358703613281, -0.0007098913192749023, -0.00021004676818847656, 0.0002897977828979492, 0.000789642333984375, 0.0012894868850708008, 0.0017893314361572266, 0.0022891759872436523, 0.002789020538330078, 0.003288865089416504, 0.0037887096405029297, 0.0042885541915893555, 0.004788398742675781, 0.005288243293762207, 0.005788087844848633, 0.006287932395935059, 0.006787776947021484, 0.00728762149810791, 0.007787466049194336, 0.008287310600280762, 0.008787155151367188, 0.009286999702453613, 0.009786844253540039, 0.010286688804626465, 0.01078653335571289, 0.011286377906799316, 0.011786222457885742, 0.012286067008972168, 0.012785911560058594, 0.01328575611114502, 0.013785600662231445, 0.014285445213317871, 0.014785289764404297, 0.015285134315490723, 0.01578497886657715, 0.016284823417663574, 0.01678466796875]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 3.0, 4.0, 8.0, 7.0, 5.0, 7.0, 7.0, 9.0, 11.0, 11.0, 16.0, 26.0, 19.0, 40.0, 51.0, 66.0, 71.0, 86.0, 104.0, 104.0, 82.0, 58.0, 44.0, 23.0, 34.0, 18.0, 13.0, 11.0, 15.0, 14.0, 6.0, 3.0, 5.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.004825592041015625, -0.0046805739402771, -0.004535555839538574, -0.004390537738800049, -0.0042455196380615234, -0.004100501537322998, -0.003955483436584473, -0.0038104653358459473, -0.003665447235107422, -0.0035204291343688965, -0.003375411033630371, -0.0032303929328918457, -0.0030853748321533203, -0.002940356731414795, -0.0027953386306762695, -0.002650320529937744, -0.0025053024291992188, -0.0023602843284606934, -0.002215266227722168, -0.0020702481269836426, -0.0019252300262451172, -0.0017802119255065918, -0.0016351938247680664, -0.001490175724029541, -0.0013451576232910156, -0.0012001395225524902, -0.0010551214218139648, -0.0009101033210754395, -0.0007650852203369141, -0.0006200671195983887, -0.0004750490188598633, -0.0003300309181213379, -0.0001850128173828125, -3.999471664428711e-05, 0.00010502338409423828, 0.00025004148483276367, 0.00039505958557128906, 0.0005400776863098145, 0.0006850957870483398, 0.0008301138877868652, 0.0009751319885253906, 0.001120150089263916, 0.0012651681900024414, 0.0014101862907409668, 0.0015552043914794922, 0.0017002224922180176, 0.001845240592956543, 0.0019902586936950684, 0.0021352767944335938, 0.002280294895172119, 0.0024253129959106445, 0.00257033109664917, 0.0027153491973876953, 0.0028603672981262207, 0.003005385398864746, 0.0031504034996032715, 0.003295421600341797, 0.0034404397010803223, 0.0035854578018188477, 0.003730475902557373, 0.0038754940032958984, 0.004020512104034424, 0.004165530204772949, 0.004310548305511475, 0.00445556640625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 39.0, 197.0, 421.0, 270.0, 54.0, 16.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.22038838267326355, -0.2153385430574417, -0.21028870344161987, -0.20523886382579803, -0.2001890242099762, -0.19513919949531555, -0.1900893598794937, -0.18503952026367188, -0.17998968064785004, -0.1749398410320282, -0.16989000141620636, -0.16484016180038452, -0.15979033708572388, -0.15474049746990204, -0.1496906578540802, -0.14464081823825836, -0.13959097862243652, -0.13454113900661469, -0.12949129939079285, -0.1244414672255516, -0.11939162760972977, -0.11434178799390793, -0.10929195582866669, -0.10424211621284485, -0.09919227659702301, -0.09414243698120117, -0.08909259736537933, -0.08404276520013809, -0.07899292558431625, -0.07394308596849442, -0.06889325380325317, -0.06384341418743134, -0.058793582022190094, -0.053743742406368256, -0.048693906515836716, -0.043644070625305176, -0.03859423100948334, -0.0335443913936615, -0.02849455550312996, -0.02344471961259842, -0.01839487999677658, -0.013345042243599892, -0.008295204490423203, -0.0032453667372465134, 0.0018044710159301758, 0.006854308769106865, 0.011904146522283554, 0.016953982412815094, 0.022003822028636932, 0.02705365978181362, 0.03210349753499031, 0.03715333342552185, 0.04220317304134369, 0.04725301265716553, 0.05230284854769707, 0.05735268443822861, 0.062402524054050446, 0.06745236366987228, 0.07250219583511353, 0.07755203545093536, 0.0826018750667572, 0.08765171468257904, 0.09270155429840088, 0.09775138646364212, 0.10280122607946396]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 4.0, 5.0, 11.0, 19.0, 18.0, 21.0, 28.0, 30.0, 36.0, 48.0, 55.0, 53.0, 56.0, 55.0, 51.0, 65.0, 49.0, 52.0, 57.0, 40.0, 51.0, 36.0, 38.0, 24.0, 31.0, 13.0, 11.0, 13.0, 6.0, 8.0, 6.0, 6.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0446050763130188, -0.04306285083293915, -0.0415206253528595, -0.039978399872779846, -0.038436174392700195, -0.036893948912620544, -0.035351723432540894, -0.03380949795246124, -0.03226727247238159, -0.03072504699230194, -0.02918282151222229, -0.02764059603214264, -0.02609837055206299, -0.024556145071983337, -0.023013919591903687, -0.021471694111824036, -0.019929468631744385, -0.018387243151664734, -0.016845017671585083, -0.015302792191505432, -0.013760566711425781, -0.01221834123134613, -0.01067611575126648, -0.009133890271186829, -0.007591664791107178, -0.006049439311027527, -0.004507213830947876, -0.002964988350868225, -0.0014227628707885742, 0.00011946260929107666, 0.0016616880893707275, 0.0032039135694503784, 0.004746139049530029, 0.00628836452960968, 0.007830590009689331, 0.009372815489768982, 0.010915040969848633, 0.012457266449928284, 0.013999491930007935, 0.015541717410087585, 0.017083942890167236, 0.018626168370246887, 0.020168393850326538, 0.02171061933040619, 0.02325284481048584, 0.02479507029056549, 0.02633729577064514, 0.027879521250724792, 0.029421746730804443, 0.030963972210884094, 0.032506197690963745, 0.034048423171043396, 0.03559064865112305, 0.0371328741312027, 0.03867509961128235, 0.040217325091362, 0.04175955057144165, 0.0433017760515213, 0.04484400153160095, 0.0463862270116806, 0.047928452491760254, 0.049470677971839905, 0.051012903451919556, 0.05255512893199921, 0.05409735441207886]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 9.0, 20.0, 39.0, 72.0, 133.0, 272.0, 794.0, 4857.0, 4154517.0, 31274.0, 1765.0, 316.0, 112.0, 47.0, 25.0, 6.0, 5.0, 4.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1060791015625, -0.10353708267211914, -0.10099506378173828, -0.09845304489135742, -0.09591102600097656, -0.0933690071105957, -0.09082698822021484, -0.08828496932983398, -0.08574295043945312, -0.08320093154907227, -0.0806589126586914, -0.07811689376831055, -0.07557487487792969, -0.07303285598754883, -0.07049083709716797, -0.06794881820678711, -0.06540679931640625, -0.06286478042602539, -0.06032276153564453, -0.05778074264526367, -0.05523872375488281, -0.05269670486450195, -0.050154685974121094, -0.047612667083740234, -0.045070648193359375, -0.042528629302978516, -0.039986610412597656, -0.0374445915222168, -0.03490257263183594, -0.03236055374145508, -0.02981853485107422, -0.02727651596069336, -0.0247344970703125, -0.02219247817993164, -0.01965045928955078, -0.017108440399169922, -0.014566421508789062, -0.012024402618408203, -0.009482383728027344, -0.006940364837646484, -0.004398345947265625, -0.0018563270568847656, 0.0006856918334960938, 0.003227710723876953, 0.0057697296142578125, 0.008311748504638672, 0.010853767395019531, 0.01339578628540039, 0.01593780517578125, 0.01847982406616211, 0.02102184295654297, 0.023563861846923828, 0.026105880737304688, 0.028647899627685547, 0.031189918518066406, 0.033731937408447266, 0.036273956298828125, 0.038815975189208984, 0.041357994079589844, 0.0439000129699707, 0.04644203186035156, 0.04898405075073242, 0.05152606964111328, 0.05406808853149414, 0.056610107421875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 13.0, 28.0, 111.0, 323.0, 328.0, 143.0, 34.0, 17.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0242767333984375, -0.023685455322265625, -0.02309417724609375, -0.022502899169921875, -0.02191162109375, -0.021320343017578125, -0.02072906494140625, -0.020137786865234375, -0.0195465087890625, -0.018955230712890625, -0.01836395263671875, -0.017772674560546875, -0.017181396484375, -0.016590118408203125, -0.01599884033203125, -0.015407562255859375, -0.0148162841796875, -0.014225006103515625, -0.01363372802734375, -0.013042449951171875, -0.012451171875, -0.011859893798828125, -0.01126861572265625, -0.010677337646484375, -0.0100860595703125, -0.009494781494140625, -0.00890350341796875, -0.008312225341796875, -0.007720947265625, -0.007129669189453125, -0.00653839111328125, -0.005947113037109375, -0.0053558349609375, -0.004764556884765625, -0.00417327880859375, -0.003582000732421875, -0.00299072265625, -0.002399444580078125, -0.00180816650390625, -0.001216888427734375, -0.0006256103515625, -3.4332275390625e-05, 0.00055694580078125, 0.001148223876953125, 0.001739501953125, 0.002330780029296875, 0.00292205810546875, 0.003513336181640625, 0.0041046142578125, 0.004695892333984375, 0.00528717041015625, 0.005878448486328125, 0.0064697265625, 0.007061004638671875, 0.00765228271484375, 0.008243560791015625, 0.0088348388671875, 0.009426116943359375, 0.01001739501953125, 0.010608673095703125, 0.011199951171875, 0.011791229248046875, 0.01238250732421875, 0.012973785400390625, 0.0135650634765625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 6.0, 4.0, 8.0, 7.0, 11.0, 22.0, 32.0, 34.0, 51.0, 84.0, 112.0, 196.0, 338.0, 774.0, 1853.0, 7310.0, 94055.0, 3759178.0, 312055.0, 13417.0, 2694.0, 922.0, 466.0, 256.0, 134.0, 84.0, 56.0, 38.0, 18.0, 24.0, 14.0, 7.0, 9.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.028350830078125, -0.027532577514648438, -0.026714324951171875, -0.025896072387695312, -0.02507781982421875, -0.024259567260742188, -0.023441314697265625, -0.022623062133789062, -0.0218048095703125, -0.020986557006835938, -0.020168304443359375, -0.019350051879882812, -0.01853179931640625, -0.017713546752929688, -0.016895294189453125, -0.016077041625976562, -0.0152587890625, -0.014440536499023438, -0.013622283935546875, -0.012804031372070312, -0.01198577880859375, -0.011167526245117188, -0.010349273681640625, -0.009531021118164062, -0.0087127685546875, -0.007894515991210938, -0.007076263427734375, -0.0062580108642578125, -0.00543975830078125, -0.0046215057373046875, -0.003803253173828125, -0.0029850006103515625, -0.002166748046875, -0.0013484954833984375, -0.000530242919921875, 0.0002880096435546875, 0.00110626220703125, 0.0019245147705078125, 0.002742767333984375, 0.0035610198974609375, 0.0043792724609375, 0.0051975250244140625, 0.006015777587890625, 0.0068340301513671875, 0.00765228271484375, 0.008470535278320312, 0.009288787841796875, 0.010107040405273438, 0.01092529296875, 0.011743545532226562, 0.012561798095703125, 0.013380050659179688, 0.01419830322265625, 0.015016555786132812, 0.015834808349609375, 0.016653060913085938, 0.0174713134765625, 0.018289566040039062, 0.019107818603515625, 0.019926071166992188, 0.02074432373046875, 0.021562576293945312, 0.022380828857421875, 0.023199081420898438, 0.024017333984375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 7.0, 5.0, 3.0, 7.0, 14.0, 20.0, 19.0, 25.0, 45.0, 56.0, 78.0, 127.0, 145.0, 203.0, 329.0, 466.0, 655.0, 540.0, 392.0, 295.0, 204.0, 132.0, 96.0, 64.0, 40.0, 32.0, 21.0, 19.0, 10.0, 7.0, 8.0, 3.0, 6.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01026153564453125, -0.009915947914123535, -0.00957036018371582, -0.009224772453308105, -0.00887918472290039, -0.008533596992492676, -0.008188009262084961, -0.007842421531677246, -0.007496833801269531, -0.007151246070861816, -0.0068056583404541016, -0.006460070610046387, -0.006114482879638672, -0.005768895149230957, -0.005423307418823242, -0.005077719688415527, -0.0047321319580078125, -0.004386544227600098, -0.004040956497192383, -0.003695368766784668, -0.003349781036376953, -0.0030041933059692383, -0.0026586055755615234, -0.0023130178451538086, -0.0019674301147460938, -0.001621842384338379, -0.001276254653930664, -0.0009306669235229492, -0.0005850791931152344, -0.00023949146270751953, 0.00010609626770019531, 0.00045168399810791016, 0.000797271728515625, 0.0011428594589233398, 0.0014884471893310547, 0.0018340349197387695, 0.0021796226501464844, 0.0025252103805541992, 0.002870798110961914, 0.003216385841369629, 0.0035619735717773438, 0.003907561302185059, 0.0042531490325927734, 0.004598736763000488, 0.004944324493408203, 0.005289912223815918, 0.005635499954223633, 0.005981087684631348, 0.0063266754150390625, 0.006672263145446777, 0.007017850875854492, 0.007363438606262207, 0.007709026336669922, 0.008054614067077637, 0.008400201797485352, 0.008745789527893066, 0.009091377258300781, 0.009436964988708496, 0.009782552719116211, 0.010128140449523926, 0.01047372817993164, 0.010819315910339355, 0.01116490364074707, 0.011510491371154785, 0.0118560791015625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 17.0, 193.0, 666.0, 121.0, 8.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16346091032028198, -0.1558249294757843, -0.14818893373012543, -0.14055293798446655, -0.13291695713996887, -0.1252809762954712, -0.11764498054981232, -0.11000899225473404, -0.10237300395965576, -0.09473701566457748, -0.0871010273694992, -0.07946503907442093, -0.07182905077934265, -0.06419306248426437, -0.056557074189186096, -0.04892108589410782, -0.04128509759902954, -0.03364910930395126, -0.026013121008872986, -0.018377132713794708, -0.01074114441871643, -0.003105156123638153, 0.0045308321714401245, 0.012166820466518402, 0.01980280876159668, 0.027438797056674957, 0.035074785351753235, 0.04271077364683151, 0.05034676194190979, 0.05798275023698807, 0.06561873853206635, 0.07325472682714462, 0.0808907151222229, 0.08852670341730118, 0.09616269171237946, 0.10379868000745773, 0.11143466830253601, 0.11907065659761429, 0.12670664489269257, 0.13434264063835144, 0.14197862148284912, 0.1496146023273468, 0.15725059807300568, 0.16488659381866455, 0.17252257466316223, 0.1801585555076599, 0.1877945512533188, 0.19543054699897766, 0.20306652784347534, 0.21070250868797302, 0.2183385044336319, 0.22597450017929077, 0.23361048102378845, 0.24124646186828613, 0.248882457613945, 0.2565184533596039, 0.26415443420410156, 0.27179041504859924, 0.2794263958930969, 0.287062406539917, 0.2946983873844147, 0.30233436822891235, 0.3099703788757324, 0.3176063597202301, 0.3252423405647278]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 2.0, 7.0, 14.0, 6.0, 11.0, 13.0, 12.0, 21.0, 18.0, 31.0, 27.0, 21.0, 34.0, 30.0, 52.0, 31.0, 47.0, 37.0, 37.0, 40.0, 45.0, 47.0, 47.0, 35.0, 35.0, 39.0, 40.0, 39.0, 18.0, 26.0, 22.0, 20.0, 18.0, 10.0, 19.0, 9.0, 8.0, 10.0, 3.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.030735492706298828, -0.02974744886159897, -0.02875940315425396, -0.02777135744690895, -0.02678331360220909, -0.02579526975750923, -0.024807224050164223, -0.023819178342819214, -0.022831134498119354, -0.021843090653419495, -0.020855044946074486, -0.019866999238729477, -0.018878955394029617, -0.017890911549329758, -0.01690286584198475, -0.01591482013463974, -0.01492677628993988, -0.013938731513917446, -0.012950686737895012, -0.011962641961872578, -0.010974597185850143, -0.00998655240982771, -0.008998507633805275, -0.00801046285778284, -0.0070224180817604065, -0.006034373305737972, -0.005046328529715538, -0.004058283753693104, -0.0030702389776706696, -0.0020821942016482353, -0.001094149425625801, -0.00010610464960336685, 0.0008819401264190674, 0.0018699849024415016, 0.002858029678463936, 0.00384607445448637, 0.004834119230508804, 0.0058221640065312386, 0.006810208782553673, 0.007798253558576107, 0.008786298334598541, 0.009774343110620975, 0.01076238788664341, 0.011750432662665844, 0.012738477438688278, 0.013726522214710712, 0.014714566990733147, 0.015702612698078156, 0.016690656542778015, 0.017678700387477875, 0.018666746094822884, 0.019654791802167892, 0.020642835646867752, 0.02163087949156761, 0.02261892519891262, 0.02360697090625763, 0.02459501475095749, 0.02558305859565735, 0.026571104303002357, 0.027559150010347366, 0.028547193855047226, 0.029535237699747086, 0.030523283407092094, 0.0315113291144371, 0.03249937295913696]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 3.0, 3.0, 5.0, 6.0, 7.0, 7.0, 13.0, 24.0, 20.0, 34.0, 29.0, 50.0, 43.0, 85.0, 83.0, 135.0, 210.0, 262.0, 384.0, 663.0, 1536.0, 10833.0, 586365.0, 435538.0, 8822.0, 1391.0, 629.0, 405.0, 251.0, 184.0, 125.0, 97.0, 90.0, 53.0, 45.0, 26.0, 23.0, 23.0, 17.0, 10.0, 6.0, 5.0, 4.0, 7.0, 4.0, 3.0, 1.0, 5.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03924560546875, -0.037734031677246094, -0.03622245788574219, -0.03471088409423828, -0.033199310302734375, -0.03168773651123047, -0.030176162719726562, -0.028664588928222656, -0.02715301513671875, -0.025641441345214844, -0.024129867553710938, -0.02261829376220703, -0.021106719970703125, -0.01959514617919922, -0.018083572387695312, -0.016571998596191406, -0.0150604248046875, -0.013548851013183594, -0.012037277221679688, -0.010525703430175781, -0.009014129638671875, -0.007502555847167969, -0.0059909820556640625, -0.004479408264160156, -0.00296783447265625, -0.0014562606811523438, 5.53131103515625e-05, 0.0015668869018554688, 0.003078460693359375, 0.004590034484863281, 0.0061016082763671875, 0.007613182067871094, 0.009124755859375, 0.010636329650878906, 0.012147903442382812, 0.013659477233886719, 0.015171051025390625, 0.01668262481689453, 0.018194198608398438, 0.019705772399902344, 0.02121734619140625, 0.022728919982910156, 0.024240493774414062, 0.02575206756591797, 0.027263641357421875, 0.02877521514892578, 0.030286788940429688, 0.031798362731933594, 0.0333099365234375, 0.034821510314941406, 0.03633308410644531, 0.03784465789794922, 0.039356231689453125, 0.04086780548095703, 0.04237937927246094, 0.043890953063964844, 0.04540252685546875, 0.046914100646972656, 0.04842567443847656, 0.04993724822998047, 0.051448822021484375, 0.05296039581298828, 0.05447196960449219, 0.055983543395996094, 0.0574951171875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 6.0, 12.0, 35.0, 137.0, 347.0, 314.0, 120.0, 28.0, 9.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0250244140625, -0.02444159984588623, -0.02385878562927246, -0.02327597141265869, -0.022693157196044922, -0.022110342979431152, -0.021527528762817383, -0.020944714546203613, -0.020361900329589844, -0.019779086112976074, -0.019196271896362305, -0.018613457679748535, -0.018030643463134766, -0.017447829246520996, -0.016865015029907227, -0.016282200813293457, -0.015699386596679688, -0.015116572380065918, -0.014533758163452148, -0.013950943946838379, -0.01336812973022461, -0.01278531551361084, -0.01220250129699707, -0.0116196870803833, -0.011036872863769531, -0.010454058647155762, -0.009871244430541992, -0.009288430213928223, -0.008705615997314453, -0.008122801780700684, -0.007539987564086914, -0.0069571733474731445, -0.006374359130859375, -0.0057915449142456055, -0.005208730697631836, -0.004625916481018066, -0.004043102264404297, -0.0034602880477905273, -0.002877473831176758, -0.0022946596145629883, -0.0017118453979492188, -0.0011290311813354492, -0.0005462169647216797, 3.6597251892089844e-05, 0.0006194114685058594, 0.001202225685119629, 0.0017850399017333984, 0.002367854118347168, 0.0029506683349609375, 0.003533482551574707, 0.0041162967681884766, 0.004699110984802246, 0.005281925201416016, 0.005864739418029785, 0.006447553634643555, 0.007030367851257324, 0.007613182067871094, 0.008195996284484863, 0.008778810501098633, 0.009361624717712402, 0.009944438934326172, 0.010527253150939941, 0.011110067367553711, 0.01169288158416748, 0.01227569580078125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 9.0, 7.0, 8.0, 23.0, 26.0, 24.0, 29.0, 57.0, 71.0, 81.0, 152.0, 188.0, 240.0, 411.0, 660.0, 1089.0, 2616.0, 10610.0, 95359.0, 748230.0, 166904.0, 15085.0, 3315.0, 1242.0, 650.0, 449.0, 256.0, 187.0, 159.0, 116.0, 67.0, 46.0, 39.0, 32.0, 31.0, 21.0, 19.0, 11.0, 7.0, 8.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.03173828125, -0.03079366683959961, -0.02984905242919922, -0.028904438018798828, -0.027959823608398438, -0.027015209197998047, -0.026070594787597656, -0.025125980377197266, -0.024181365966796875, -0.023236751556396484, -0.022292137145996094, -0.021347522735595703, -0.020402908325195312, -0.019458293914794922, -0.01851367950439453, -0.01756906509399414, -0.01662445068359375, -0.01567983627319336, -0.014735221862792969, -0.013790607452392578, -0.012845993041992188, -0.011901378631591797, -0.010956764221191406, -0.010012149810791016, -0.009067535400390625, -0.008122920989990234, -0.007178306579589844, -0.006233692169189453, -0.0052890777587890625, -0.004344463348388672, -0.0033998489379882812, -0.0024552345275878906, -0.0015106201171875, -0.0005660057067871094, 0.00037860870361328125, 0.0013232231140136719, 0.0022678375244140625, 0.003212451934814453, 0.004157066345214844, 0.005101680755615234, 0.006046295166015625, 0.006990909576416016, 0.007935523986816406, 0.008880138397216797, 0.009824752807617188, 0.010769367218017578, 0.011713981628417969, 0.01265859603881836, 0.01360321044921875, 0.01454782485961914, 0.015492439270019531, 0.016437053680419922, 0.017381668090820312, 0.018326282501220703, 0.019270896911621094, 0.020215511322021484, 0.021160125732421875, 0.022104740142822266, 0.023049354553222656, 0.023993968963623047, 0.024938583374023438, 0.025883197784423828, 0.02682781219482422, 0.02777242660522461, 0.028717041015625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 8.0, 7.0, 12.0, 16.0, 13.0, 27.0, 36.0, 27.0, 47.0, 66.0, 61.0, 59.0, 67.0, 61.0, 55.0, 62.0, 52.0, 47.0, 55.0, 45.0, 37.0, 27.0, 28.0, 13.0, 18.0, 7.0, 11.0, 6.0, 10.0, 7.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01386260986328125, -0.013416290283203125, -0.012969970703125, -0.012523651123046875, -0.01207733154296875, -0.011631011962890625, -0.0111846923828125, -0.010738372802734375, -0.01029205322265625, -0.009845733642578125, -0.0093994140625, -0.008953094482421875, -0.00850677490234375, -0.008060455322265625, -0.0076141357421875, -0.007167816162109375, -0.00672149658203125, -0.006275177001953125, -0.005828857421875, -0.005382537841796875, -0.00493621826171875, -0.004489898681640625, -0.0040435791015625, -0.003597259521484375, -0.00315093994140625, -0.002704620361328125, -0.00225830078125, -0.001811981201171875, -0.00136566162109375, -0.000919342041015625, -0.0004730224609375, -2.6702880859375e-05, 0.00041961669921875, 0.000865936279296875, 0.001312255859375, 0.001758575439453125, 0.00220489501953125, 0.002651214599609375, 0.0030975341796875, 0.003543853759765625, 0.00399017333984375, 0.004436492919921875, 0.0048828125, 0.005329132080078125, 0.00577545166015625, 0.006221771240234375, 0.0066680908203125, 0.007114410400390625, 0.00756072998046875, 0.008007049560546875, 0.008453369140625, 0.008899688720703125, 0.00934600830078125, 0.009792327880859375, 0.0102386474609375, 0.010684967041015625, 0.01113128662109375, 0.011577606201171875, 0.01202392578125, 0.012470245361328125, 0.01291656494140625, 0.013362884521484375, 0.0138092041015625, 0.014255523681640625, 0.01470184326171875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 5.0, 6.0, 6.0, 10.0, 16.0, 12.0, 21.0, 28.0, 34.0, 64.0, 113.0, 261.0, 577.0, 1830.0, 7479.0, 138670.0, 882653.0, 12720.0, 2550.0, 822.0, 321.0, 136.0, 76.0, 50.0, 21.0, 21.0, 18.0, 9.0, 6.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.047393798828125, -0.046082496643066406, -0.04477119445800781, -0.04345989227294922, -0.042148590087890625, -0.04083728790283203, -0.03952598571777344, -0.038214683532714844, -0.03690338134765625, -0.035592079162597656, -0.03428077697753906, -0.03296947479248047, -0.031658172607421875, -0.03034687042236328, -0.029035568237304688, -0.027724266052246094, -0.0264129638671875, -0.025101661682128906, -0.023790359497070312, -0.02247905731201172, -0.021167755126953125, -0.01985645294189453, -0.018545150756835938, -0.017233848571777344, -0.01592254638671875, -0.014611244201660156, -0.013299942016601562, -0.011988639831542969, -0.010677337646484375, -0.009366035461425781, -0.008054733276367188, -0.006743431091308594, -0.00543212890625, -0.004120826721191406, -0.0028095245361328125, -0.0014982223510742188, -0.000186920166015625, 0.0011243820190429688, 0.0024356842041015625, 0.0037469863891601562, 0.00505828857421875, 0.006369590759277344, 0.0076808929443359375, 0.008992195129394531, 0.010303497314453125, 0.011614799499511719, 0.012926101684570312, 0.014237403869628906, 0.0155487060546875, 0.016860008239746094, 0.018171310424804688, 0.01948261260986328, 0.020793914794921875, 0.02210521697998047, 0.023416519165039062, 0.024727821350097656, 0.02603912353515625, 0.027350425720214844, 0.028661727905273438, 0.02997303009033203, 0.031284332275390625, 0.03259563446044922, 0.03390693664550781, 0.035218238830566406, 0.036529541015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 9.0, 11.0, 8.0, 16.0, 23.0, 24.0, 43.0, 86.0, 102.0, 183.0, 169.0, 99.0, 65.0, 45.0, 31.0, 24.0, 14.0, 14.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018906593322753906, -0.00018313899636268616, -0.00017721205949783325, -0.00017128512263298035, -0.00016535818576812744, -0.00015943124890327454, -0.00015350431203842163, -0.00014757737517356873, -0.00014165043830871582, -0.00013572350144386292, -0.00012979656457901, -0.0001238696277141571, -0.0001179426908493042, -0.0001120157539844513, -0.00010608881711959839, -0.00010016188025474548, -9.423494338989258e-05, -8.830800652503967e-05, -8.238106966018677e-05, -7.645413279533386e-05, -7.052719593048096e-05, -6.460025906562805e-05, -5.8673322200775146e-05, -5.274638533592224e-05, -4.6819448471069336e-05, -4.089251160621643e-05, -3.4965574741363525e-05, -2.903863787651062e-05, -2.3111701011657715e-05, -1.718476414680481e-05, -1.1257827281951904e-05, -5.330890417098999e-06, 5.960464477539062e-07, 6.5229833126068115e-06, 1.2449920177459717e-05, 1.8376857042312622e-05, 2.4303793907165527e-05, 3.0230730772018433e-05, 3.615766763687134e-05, 4.208460450172424e-05, 4.801154136657715e-05, 5.3938478231430054e-05, 5.986541509628296e-05, 6.579235196113586e-05, 7.171928882598877e-05, 7.764622569084167e-05, 8.357316255569458e-05, 8.950009942054749e-05, 9.542703628540039e-05, 0.0001013539731502533, 0.0001072809100151062, 0.0001132078468799591, 0.00011913478374481201, 0.00012506172060966492, 0.00013098865747451782, 0.00013691559433937073, 0.00014284253120422363, 0.00014876946806907654, 0.00015469640493392944, 0.00016062334179878235, 0.00016655027866363525, 0.00017247721552848816, 0.00017840415239334106, 0.00018433108925819397, 0.00019025802612304688]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 5.0, 11.0, 5.0, 9.0, 8.0, 11.0, 25.0, 19.0, 26.0, 47.0, 88.0, 137.0, 275.0, 643.0, 2081.0, 9835.0, 195130.0, 819532.0, 16472.0, 2637.0, 768.0, 312.0, 156.0, 96.0, 66.0, 51.0, 33.0, 22.0, 14.0, 10.0, 9.0, 3.0, 6.0, 4.0, 1.0, 1.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.032989501953125, -0.03210091590881348, -0.031212329864501953, -0.03032374382019043, -0.029435157775878906, -0.028546571731567383, -0.02765798568725586, -0.026769399642944336, -0.025880813598632812, -0.02499222755432129, -0.024103641510009766, -0.023215055465698242, -0.02232646942138672, -0.021437883377075195, -0.020549297332763672, -0.01966071128845215, -0.018772125244140625, -0.0178835391998291, -0.016994953155517578, -0.016106367111206055, -0.015217781066894531, -0.014329195022583008, -0.013440608978271484, -0.012552022933959961, -0.011663436889648438, -0.010774850845336914, -0.00988626480102539, -0.008997678756713867, -0.008109092712402344, -0.00722050666809082, -0.006331920623779297, -0.0054433345794677734, -0.00455474853515625, -0.0036661624908447266, -0.002777576446533203, -0.0018889904022216797, -0.0010004043579101562, -0.00011181831359863281, 0.0007767677307128906, 0.001665353775024414, 0.0025539398193359375, 0.003442525863647461, 0.004331111907958984, 0.005219697952270508, 0.006108283996582031, 0.006996870040893555, 0.007885456085205078, 0.008774042129516602, 0.009662628173828125, 0.010551214218139648, 0.011439800262451172, 0.012328386306762695, 0.013216972351074219, 0.014105558395385742, 0.014994144439697266, 0.01588273048400879, 0.016771316528320312, 0.017659902572631836, 0.01854848861694336, 0.019437074661254883, 0.020325660705566406, 0.02121424674987793, 0.022102832794189453, 0.022991418838500977, 0.0238800048828125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 9.0, 7.0, 7.0, 9.0, 11.0, 13.0, 13.0, 22.0, 84.0, 163.0, 274.0, 196.0, 77.0, 38.0, 21.0, 15.0, 15.0, 4.0, 3.0, 3.0, 3.0, 4.0, 4.0, 0.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01406097412109375, -0.013676762580871582, -0.013292551040649414, -0.012908339500427246, -0.012524127960205078, -0.01213991641998291, -0.011755704879760742, -0.011371493339538574, -0.010987281799316406, -0.010603070259094238, -0.01021885871887207, -0.009834647178649902, -0.009450435638427734, -0.009066224098205566, -0.008682012557983398, -0.00829780101776123, -0.007913589477539062, -0.0075293779373168945, -0.0071451663970947266, -0.006760954856872559, -0.006376743316650391, -0.005992531776428223, -0.005608320236206055, -0.005224108695983887, -0.004839897155761719, -0.004455685615539551, -0.004071474075317383, -0.003687262535095215, -0.003303050994873047, -0.002918839454650879, -0.002534627914428711, -0.002150416374206543, -0.001766204833984375, -0.001381993293762207, -0.000997781753540039, -0.0006135702133178711, -0.00022935867309570312, 0.00015485286712646484, 0.0005390644073486328, 0.0009232759475708008, 0.0013074874877929688, 0.0016916990280151367, 0.0020759105682373047, 0.0024601221084594727, 0.0028443336486816406, 0.0032285451889038086, 0.0036127567291259766, 0.0039969682693481445, 0.0043811798095703125, 0.0047653913497924805, 0.0051496028900146484, 0.005533814430236816, 0.005918025970458984, 0.006302237510681152, 0.00668644905090332, 0.007070660591125488, 0.007454872131347656, 0.007839083671569824, 0.008223295211791992, 0.00860750675201416, 0.008991718292236328, 0.009375929832458496, 0.009760141372680664, 0.010144352912902832, 0.010528564453125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 44.0, 242.0, 514.0, 158.0, 27.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.20000746846199036, -0.19400620460510254, -0.18800494074821472, -0.1820036619901657, -0.1760023981332779, -0.17000113427639008, -0.16399985551834106, -0.15799859166145325, -0.15199732780456543, -0.1459960639476776, -0.1399948000907898, -0.13399352133274078, -0.12799225747585297, -0.12199099361896515, -0.11598972231149673, -0.10998845100402832, -0.1039871871471405, -0.09798592329025269, -0.09198465198278427, -0.08598338067531586, -0.07998211681842804, -0.07398085296154022, -0.06797958165407181, -0.06197831407189369, -0.055977046489715576, -0.04997577890753746, -0.043974511325359344, -0.03797324374318123, -0.03197197616100311, -0.025970708578824997, -0.01996944099664688, -0.013968173414468765, -0.00796690583229065, -0.0019656382501125336, 0.004035629332065582, 0.010036896914243698, 0.016038164496421814, 0.02203943207859993, 0.028040699660778046, 0.03404196724295616, 0.04004323482513428, 0.04604450240731239, 0.05204576998949051, 0.058047037571668625, 0.06404830515384674, 0.07004956901073456, 0.07605084031820297, 0.08205211162567139, 0.0880533754825592, 0.09405463933944702, 0.10005591064691544, 0.10605718195438385, 0.11205844581127167, 0.11805970966815948, 0.1240609809756279, 0.1300622522830963, 0.13606351613998413, 0.14206477999687195, 0.14806604385375977, 0.15406732261180878, 0.1600685864686966, 0.1660698503255844, 0.17207112908363342, 0.17807239294052124, 0.18407365679740906]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 6.0, 13.0, 14.0, 21.0, 26.0, 38.0, 59.0, 66.0, 77.0, 87.0, 91.0, 96.0, 91.0, 82.0, 68.0, 49.0, 37.0, 29.0, 23.0, 12.0, 10.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07388091087341309, -0.07148758322000504, -0.06909425556659698, -0.06670092791318893, -0.06430760025978088, -0.061914268881082535, -0.059520937502384186, -0.057127609848976135, -0.054734282195568085, -0.052340954542160034, -0.049947626888751984, -0.047554295510053635, -0.045160967856645584, -0.042767640203237534, -0.040374308824539185, -0.037980981171131134, -0.035587653517723083, -0.03319432586431503, -0.030800996348261833, -0.028407666832208633, -0.026014339178800583, -0.023621011525392532, -0.021227682009339333, -0.018834352493286133, -0.016441024839878082, -0.014047696255147457, -0.011654367670416832, -0.009261039085686207, -0.006867710500955582, -0.0044743819162249565, -0.0020810533314943314, 0.0003122761845588684, 0.002705603837966919, 0.005098932422697544, 0.007492261007428169, 0.009885589592158794, 0.01227891817688942, 0.014672246761620045, 0.01706557534635067, 0.01945890486240387, 0.02185223251581192, 0.02424556016921997, 0.02663888968527317, 0.02903221920132637, 0.03142554685473442, 0.03381887450814247, 0.03621220588684082, 0.03860553354024887, 0.04099886119365692, 0.04339218884706497, 0.04578551650047302, 0.04817884787917137, 0.05057217553257942, 0.05296550318598747, 0.05535883456468582, 0.05775216221809387, 0.06014548987150192, 0.06253881752490997, 0.06493214517831802, 0.06732547283172607, 0.06971880793571472, 0.07211213558912277, 0.07450546324253082, 0.07689879089593887, 0.07929211854934692]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 12.0, 31.0, 25.0, 44.0, 80.0, 138.0, 263.0, 593.0, 2661.0, 53849.0, 4121689.0, 11676.0, 2214.0, 683.0, 154.0, 73.0, 40.0, 23.0, 5.0, 7.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0543212890625, -0.05303835868835449, -0.051755428314208984, -0.05047249794006348, -0.04918956756591797, -0.04790663719177246, -0.04662370681762695, -0.045340776443481445, -0.04405784606933594, -0.04277491569519043, -0.04149198532104492, -0.040209054946899414, -0.038926124572753906, -0.0376431941986084, -0.03636026382446289, -0.03507733345031738, -0.033794403076171875, -0.03251147270202637, -0.03122854232788086, -0.02994561195373535, -0.028662681579589844, -0.027379751205444336, -0.026096820831298828, -0.02481389045715332, -0.023530960083007812, -0.022248029708862305, -0.020965099334716797, -0.01968216896057129, -0.01839923858642578, -0.017116308212280273, -0.015833377838134766, -0.014550447463989258, -0.01326751708984375, -0.011984586715698242, -0.010701656341552734, -0.009418725967407227, -0.008135795593261719, -0.006852865219116211, -0.005569934844970703, -0.004287004470825195, -0.0030040740966796875, -0.0017211437225341797, -0.0004382133483886719, 0.0008447170257568359, 0.0021276473999023438, 0.0034105777740478516, 0.004693508148193359, 0.005976438522338867, 0.007259368896484375, 0.008542299270629883, 0.00982522964477539, 0.011108160018920898, 0.012391090393066406, 0.013674020767211914, 0.014956951141357422, 0.01623988151550293, 0.017522811889648438, 0.018805742263793945, 0.020088672637939453, 0.02137160301208496, 0.02265453338623047, 0.023937463760375977, 0.025220394134521484, 0.026503324508666992, 0.0277862548828125]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 10.0, 16.0, 73.0, 208.0, 354.0, 241.0, 79.0, 22.0, 4.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0237579345703125, -0.02319943904876709, -0.02264094352722168, -0.02208244800567627, -0.02152395248413086, -0.02096545696258545, -0.02040696144104004, -0.01984846591949463, -0.01928997039794922, -0.01873147487640381, -0.0181729793548584, -0.01761448383331299, -0.017055988311767578, -0.016497492790222168, -0.015938997268676758, -0.015380501747131348, -0.014822006225585938, -0.014263510704040527, -0.013705015182495117, -0.013146519660949707, -0.012588024139404297, -0.012029528617858887, -0.011471033096313477, -0.010912537574768066, -0.010354042053222656, -0.009795546531677246, -0.009237051010131836, -0.008678555488586426, -0.008120059967041016, -0.0075615644454956055, -0.007003068923950195, -0.006444573402404785, -0.005886077880859375, -0.005327582359313965, -0.004769086837768555, -0.0042105913162231445, -0.0036520957946777344, -0.0030936002731323242, -0.002535104751586914, -0.001976609230041504, -0.0014181137084960938, -0.0008596181869506836, -0.00030112266540527344, 0.0002573728561401367, 0.0008158683776855469, 0.001374363899230957, 0.0019328594207763672, 0.0024913549423217773, 0.0030498504638671875, 0.0036083459854125977, 0.004166841506958008, 0.004725337028503418, 0.005283832550048828, 0.005842328071594238, 0.0064008235931396484, 0.006959319114685059, 0.007517814636230469, 0.008076310157775879, 0.008634805679321289, 0.0091933012008667, 0.00975179672241211, 0.01031029224395752, 0.01086878776550293, 0.01142728328704834, 0.01198577880859375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 12.0, 8.0, 18.0, 29.0, 39.0, 47.0, 80.0, 145.0, 206.0, 445.0, 981.0, 2975.0, 17275.0, 1151023.0, 2985868.0, 29013.0, 3848.0, 1160.0, 478.0, 262.0, 128.0, 72.0, 60.0, 26.0, 26.0, 18.0, 15.0, 5.0, 4.0, 3.0, 3.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0296630859375, -0.028884410858154297, -0.028105735778808594, -0.02732706069946289, -0.026548385620117188, -0.025769710540771484, -0.02499103546142578, -0.024212360382080078, -0.023433685302734375, -0.022655010223388672, -0.02187633514404297, -0.021097660064697266, -0.020318984985351562, -0.01954030990600586, -0.018761634826660156, -0.017982959747314453, -0.01720428466796875, -0.016425609588623047, -0.015646934509277344, -0.01486825942993164, -0.014089584350585938, -0.013310909271240234, -0.012532234191894531, -0.011753559112548828, -0.010974884033203125, -0.010196208953857422, -0.009417533874511719, -0.008638858795166016, -0.007860183715820312, -0.007081508636474609, -0.006302833557128906, -0.005524158477783203, -0.0047454833984375, -0.003966808319091797, -0.0031881332397460938, -0.0024094581604003906, -0.0016307830810546875, -0.0008521080017089844, -7.343292236328125e-05, 0.0007052421569824219, 0.001483917236328125, 0.002262592315673828, 0.0030412673950195312, 0.0038199424743652344, 0.0045986175537109375, 0.005377292633056641, 0.006155967712402344, 0.006934642791748047, 0.00771331787109375, 0.008491992950439453, 0.009270668029785156, 0.01004934310913086, 0.010828018188476562, 0.011606693267822266, 0.012385368347167969, 0.013164043426513672, 0.013942718505859375, 0.014721393585205078, 0.015500068664550781, 0.016278743743896484, 0.017057418823242188, 0.01783609390258789, 0.018614768981933594, 0.019393444061279297, 0.020172119140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 8.0, 8.0, 9.0, 14.0, 20.0, 17.0, 39.0, 36.0, 81.0, 112.0, 164.0, 235.0, 305.0, 429.0, 542.0, 537.0, 402.0, 318.0, 216.0, 160.0, 117.0, 78.0, 66.0, 42.0, 27.0, 28.0, 19.0, 8.0, 10.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00682830810546875, -0.006565570831298828, -0.006302833557128906, -0.006040096282958984, -0.0057773590087890625, -0.005514621734619141, -0.005251884460449219, -0.004989147186279297, -0.004726409912109375, -0.004463672637939453, -0.004200935363769531, -0.003938198089599609, -0.0036754608154296875, -0.0034127235412597656, -0.0031499862670898438, -0.002887248992919922, -0.00262451171875, -0.002361774444580078, -0.0020990371704101562, -0.0018362998962402344, -0.0015735626220703125, -0.0013108253479003906, -0.0010480880737304688, -0.0007853507995605469, -0.000522613525390625, -0.0002598762512207031, 2.86102294921875e-06, 0.0002655982971191406, 0.0005283355712890625, 0.0007910728454589844, 0.0010538101196289062, 0.0013165473937988281, 0.00157928466796875, 0.0018420219421386719, 0.0021047592163085938, 0.0023674964904785156, 0.0026302337646484375, 0.0028929710388183594, 0.0031557083129882812, 0.003418445587158203, 0.003681182861328125, 0.003943920135498047, 0.004206657409667969, 0.004469394683837891, 0.0047321319580078125, 0.004994869232177734, 0.005257606506347656, 0.005520343780517578, 0.0057830810546875, 0.006045818328857422, 0.006308555603027344, 0.006571292877197266, 0.0068340301513671875, 0.007096767425537109, 0.007359504699707031, 0.007622241973876953, 0.007884979248046875, 0.008147716522216797, 0.008410453796386719, 0.00867319107055664, 0.008935928344726562, 0.009198665618896484, 0.009461402893066406, 0.009724140167236328, 0.00998687744140625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 10.0, 53.0, 269.0, 425.0, 193.0, 35.0, 8.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10985051095485687, -0.10610388964414597, -0.10235727578401566, -0.09861065447330475, -0.09486403316259384, -0.09111741930246353, -0.08737079799175262, -0.08362418413162231, -0.07987756282091141, -0.0761309415102005, -0.07238432765007019, -0.06863770633935928, -0.06489108502864838, -0.061144471168518066, -0.05739784985780716, -0.05365123227238655, -0.049904610961675644, -0.046157993376255035, -0.04241137206554413, -0.03866475448012352, -0.03491813689470291, -0.031171517446637154, -0.027424897998571396, -0.023678280413150787, -0.01993166096508503, -0.016185041517019272, -0.012438423931598663, -0.008691804483532906, -0.0049451859667897224, -0.0011985674500465393, 0.0025480519980192184, 0.006294669583439827, 0.010041289031505585, 0.013787907548248768, 0.01753452606499195, 0.02128114551305771, 0.025027763098478317, 0.028774382546544075, 0.03252100199460983, 0.03626761958003044, 0.04001423716545105, 0.04376085475087166, 0.047507476061582565, 0.051254093647003174, 0.05500071123242378, 0.05874732881784439, 0.0624939501285553, 0.06624056398868561, 0.06998719274997711, 0.07373381406068802, 0.07748042792081833, 0.08122704923152924, 0.08497367054224014, 0.08872028440237045, 0.09246690571308136, 0.09621351957321167, 0.09996014088392258, 0.10370676219463348, 0.1074533760547638, 0.1111999973654747, 0.11494661867618561, 0.11869323253631592, 0.12243985384702682, 0.12618647515773773, 0.12993308901786804]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 7.0, 3.0, 5.0, 9.0, 8.0, 17.0, 18.0, 35.0, 21.0, 29.0, 29.0, 41.0, 36.0, 45.0, 46.0, 49.0, 48.0, 58.0, 46.0, 48.0, 54.0, 43.0, 40.0, 45.0, 48.0, 34.0, 24.0, 32.0, 21.0, 10.0, 16.0, 4.0, 12.0, 10.0, 4.0, 1.0, 6.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030046820640563965, -0.02914697304368019, -0.028247123584151268, -0.027347274124622345, -0.02644742652773857, -0.025547578930854797, -0.024647729471325874, -0.02374788001179695, -0.022848032414913177, -0.021948184818029404, -0.02104833535850048, -0.020148485898971558, -0.019248638302087784, -0.01834879070520401, -0.017448941245675087, -0.016549091786146164, -0.01564924418926239, -0.014749395661056042, -0.013849547132849693, -0.012949698604643345, -0.012049850076436996, -0.011150001548230648, -0.0102501530200243, -0.009350304491817951, -0.008450455963611603, -0.007550607435405254, -0.006650758907198906, -0.0057509103789925575, -0.004851061850786209, -0.003951213322579861, -0.0030513647943735123, -0.002151516266167164, -0.0012516677379608154, -0.000351819209754467, 0.0005480293184518814, 0.0014478778466582298, 0.0023477263748645782, 0.0032475749030709267, 0.004147423431277275, 0.0050472719594836235, 0.005947120487689972, 0.00684696901589632, 0.007746817544102669, 0.008646666072309017, 0.009546514600515366, 0.010446363128721714, 0.011346211656928062, 0.01224606018513441, 0.01314590871334076, 0.014045757241547108, 0.014945605769753456, 0.01584545522928238, 0.016745302826166153, 0.017645150423049927, 0.01854499988257885, 0.019444849342107773, 0.020344696938991547, 0.02124454453587532, 0.022144393995404243, 0.023044243454933167, 0.02394409105181694, 0.024843938648700714, 0.025743788108229637, 0.02664363756775856, 0.027543485164642334]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 2.0, 7.0, 7.0, 13.0, 17.0, 13.0, 19.0, 36.0, 33.0, 71.0, 93.0, 135.0, 211.0, 293.0, 497.0, 894.0, 3313.0, 144288.0, 882456.0, 12845.0, 1480.0, 663.0, 393.0, 236.0, 164.0, 121.0, 76.0, 63.0, 31.0, 25.0, 17.0, 12.0, 13.0, 5.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.05267333984375, -0.05113506317138672, -0.04959678649902344, -0.048058509826660156, -0.046520233154296875, -0.044981956481933594, -0.04344367980957031, -0.04190540313720703, -0.04036712646484375, -0.03882884979248047, -0.03729057312011719, -0.035752296447753906, -0.034214019775390625, -0.032675743103027344, -0.031137466430664062, -0.02959918975830078, -0.0280609130859375, -0.02652263641357422, -0.024984359741210938, -0.023446083068847656, -0.021907806396484375, -0.020369529724121094, -0.018831253051757812, -0.01729297637939453, -0.01575469970703125, -0.014216423034667969, -0.012678146362304688, -0.011139869689941406, -0.009601593017578125, -0.008063316345214844, -0.0065250396728515625, -0.004986763000488281, -0.003448486328125, -0.0019102096557617188, -0.0003719329833984375, 0.0011663436889648438, 0.002704620361328125, 0.004242897033691406, 0.0057811737060546875, 0.007319450378417969, 0.00885772705078125, 0.010396003723144531, 0.011934280395507812, 0.013472557067871094, 0.015010833740234375, 0.016549110412597656, 0.018087387084960938, 0.01962566375732422, 0.0211639404296875, 0.02270221710205078, 0.024240493774414062, 0.025778770446777344, 0.027317047119140625, 0.028855323791503906, 0.030393600463867188, 0.03193187713623047, 0.03347015380859375, 0.03500843048095703, 0.03654670715332031, 0.038084983825683594, 0.039623260498046875, 0.041161537170410156, 0.04269981384277344, 0.04423809051513672, 0.0457763671875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 7.0, 20.0, 65.0, 226.0, 353.0, 238.0, 79.0, 19.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0234222412109375, -0.02287137508392334, -0.02232050895690918, -0.02176964282989502, -0.02121877670288086, -0.0206679105758667, -0.02011704444885254, -0.01956617832183838, -0.01901531219482422, -0.01846444606781006, -0.0179135799407959, -0.01736271381378174, -0.016811847686767578, -0.016260981559753418, -0.015710115432739258, -0.015159249305725098, -0.014608383178710938, -0.014057517051696777, -0.013506650924682617, -0.012955784797668457, -0.012404918670654297, -0.011854052543640137, -0.011303186416625977, -0.010752320289611816, -0.010201454162597656, -0.009650588035583496, -0.009099721908569336, -0.008548855781555176, -0.007997989654541016, -0.0074471235275268555, -0.006896257400512695, -0.006345391273498535, -0.005794525146484375, -0.005243659019470215, -0.004692792892456055, -0.0041419267654418945, -0.0035910606384277344, -0.0030401945114135742, -0.002489328384399414, -0.001938462257385254, -0.0013875961303710938, -0.0008367300033569336, -0.00028586387634277344, 0.0002650022506713867, 0.0008158683776855469, 0.001366734504699707, 0.0019176006317138672, 0.0024684667587280273, 0.0030193328857421875, 0.0035701990127563477, 0.004121065139770508, 0.004671931266784668, 0.005222797393798828, 0.005773663520812988, 0.0063245296478271484, 0.006875395774841309, 0.007426261901855469, 0.007977128028869629, 0.008527994155883789, 0.00907886028289795, 0.00962972640991211, 0.01018059253692627, 0.01073145866394043, 0.01128232479095459, 0.01183319091796875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 8.0, 3.0, 3.0, 11.0, 5.0, 4.0, 7.0, 15.0, 15.0, 24.0, 33.0, 47.0, 44.0, 80.0, 86.0, 123.0, 207.0, 303.0, 409.0, 699.0, 1301.0, 3422.0, 17182.0, 268276.0, 700256.0, 45488.0, 5907.0, 1956.0, 903.0, 572.0, 325.0, 238.0, 158.0, 115.0, 79.0, 62.0, 46.0, 34.0, 33.0, 15.0, 20.0, 7.0, 8.0, 9.0, 11.0, 6.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0300140380859375, -0.029110193252563477, -0.028206348419189453, -0.02730250358581543, -0.026398658752441406, -0.025494813919067383, -0.02459096908569336, -0.023687124252319336, -0.022783279418945312, -0.02187943458557129, -0.020975589752197266, -0.020071744918823242, -0.01916790008544922, -0.018264055252075195, -0.017360210418701172, -0.01645636558532715, -0.015552520751953125, -0.014648675918579102, -0.013744831085205078, -0.012840986251831055, -0.011937141418457031, -0.011033296585083008, -0.010129451751708984, -0.009225606918334961, -0.008321762084960938, -0.007417917251586914, -0.006514072418212891, -0.005610227584838867, -0.004706382751464844, -0.0038025379180908203, -0.002898693084716797, -0.0019948482513427734, -0.00109100341796875, -0.00018715858459472656, 0.0007166862487792969, 0.0016205310821533203, 0.0025243759155273438, 0.003428220748901367, 0.004332065582275391, 0.005235910415649414, 0.0061397552490234375, 0.007043600082397461, 0.007947444915771484, 0.008851289749145508, 0.009755134582519531, 0.010658979415893555, 0.011562824249267578, 0.012466669082641602, 0.013370513916015625, 0.014274358749389648, 0.015178203582763672, 0.016082048416137695, 0.01698589324951172, 0.017889738082885742, 0.018793582916259766, 0.01969742774963379, 0.020601272583007812, 0.021505117416381836, 0.02240896224975586, 0.023312807083129883, 0.024216651916503906, 0.02512049674987793, 0.026024341583251953, 0.026928186416625977, 0.02783203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 8.0, 6.0, 6.0, 10.0, 22.0, 19.0, 17.0, 24.0, 24.0, 27.0, 38.0, 33.0, 49.0, 56.0, 63.0, 53.0, 59.0, 62.0, 39.0, 59.0, 48.0, 45.0, 43.0, 31.0, 30.0, 20.0, 18.0, 20.0, 10.0, 9.0, 7.0, 6.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.012603759765625, -0.012232780456542969, -0.011861801147460938, -0.011490821838378906, -0.011119842529296875, -0.010748863220214844, -0.010377883911132812, -0.010006904602050781, -0.00963592529296875, -0.009264945983886719, -0.008893966674804688, -0.008522987365722656, -0.008152008056640625, -0.007781028747558594, -0.0074100494384765625, -0.007039070129394531, -0.0066680908203125, -0.006297111511230469, -0.0059261322021484375, -0.005555152893066406, -0.005184173583984375, -0.004813194274902344, -0.0044422149658203125, -0.004071235656738281, -0.00370025634765625, -0.0033292770385742188, -0.0029582977294921875, -0.0025873184204101562, -0.002216339111328125, -0.0018453598022460938, -0.0014743804931640625, -0.0011034011840820312, -0.000732421875, -0.00036144256591796875, 9.5367431640625e-06, 0.00038051605224609375, 0.000751495361328125, 0.0011224746704101562, 0.0014934539794921875, 0.0018644332885742188, 0.00223541259765625, 0.0026063919067382812, 0.0029773712158203125, 0.0033483505249023438, 0.003719329833984375, 0.004090309143066406, 0.0044612884521484375, 0.004832267761230469, 0.0052032470703125, 0.005574226379394531, 0.0059452056884765625, 0.006316184997558594, 0.006687164306640625, 0.007058143615722656, 0.0074291229248046875, 0.007800102233886719, 0.00817108154296875, 0.008542060852050781, 0.008913040161132812, 0.009284019470214844, 0.009654998779296875, 0.010025978088378906, 0.010396957397460938, 0.010767936706542969, 0.011138916015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 13.0, 11.0, 17.0, 24.0, 29.0, 39.0, 46.0, 83.0, 173.0, 268.0, 574.0, 1230.0, 4119.0, 20729.0, 264295.0, 703240.0, 43405.0, 6758.0, 1872.0, 732.0, 331.0, 199.0, 129.0, 70.0, 50.0, 22.0, 20.0, 21.0, 14.0, 9.0, 6.0, 7.0, 2.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0120086669921875, -0.011667251586914062, -0.011325836181640625, -0.010984420776367188, -0.01064300537109375, -0.010301589965820312, -0.009960174560546875, -0.009618759155273438, -0.00927734375, -0.008935928344726562, -0.008594512939453125, -0.008253097534179688, -0.00791168212890625, -0.0075702667236328125, -0.007228851318359375, -0.0068874359130859375, -0.0065460205078125, -0.0062046051025390625, -0.005863189697265625, -0.0055217742919921875, -0.00518035888671875, -0.0048389434814453125, -0.004497528076171875, -0.0041561126708984375, -0.003814697265625, -0.0034732818603515625, -0.003131866455078125, -0.0027904510498046875, -0.00244903564453125, -0.0021076202392578125, -0.001766204833984375, -0.0014247894287109375, -0.0010833740234375, -0.0007419586181640625, -0.000400543212890625, -5.91278076171875e-05, 0.00028228759765625, 0.0006237030029296875, 0.000965118408203125, 0.0013065338134765625, 0.00164794921875, 0.0019893646240234375, 0.002330780029296875, 0.0026721954345703125, 0.00301361083984375, 0.0033550262451171875, 0.003696441650390625, 0.0040378570556640625, 0.0043792724609375, 0.0047206878662109375, 0.005062103271484375, 0.0054035186767578125, 0.00574493408203125, 0.0060863494873046875, 0.006427764892578125, 0.0067691802978515625, 0.007110595703125, 0.0074520111083984375, 0.007793426513671875, 0.008134841918945312, 0.00847625732421875, 0.008817672729492188, 0.009159088134765625, 0.009500503540039062, 0.0098419189453125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 10.0, 7.0, 9.0, 19.0, 24.0, 35.0, 47.0, 74.0, 92.0, 108.0, 108.0, 111.0, 85.0, 69.0, 45.0, 41.0, 29.0, 24.0, 14.0, 6.0, 7.0, 4.0, 3.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001016855239868164, -9.837653487920761e-05, -9.506754577159882e-05, -9.175855666399002e-05, -8.844956755638123e-05, -8.514057844877243e-05, -8.183158934116364e-05, -7.852260023355484e-05, -7.521361112594604e-05, -7.190462201833725e-05, -6.859563291072845e-05, -6.528664380311966e-05, -6.197765469551086e-05, -5.866866558790207e-05, -5.5359676480293274e-05, -5.205068737268448e-05, -4.8741698265075684e-05, -4.543270915746689e-05, -4.212372004985809e-05, -3.88147309422493e-05, -3.55057418346405e-05, -3.219675272703171e-05, -2.8887763619422913e-05, -2.5578774511814117e-05, -2.2269785404205322e-05, -1.8960796296596527e-05, -1.5651807188987732e-05, -1.2342818081378937e-05, -9.033828973770142e-06, -5.7248398661613464e-06, -2.4158507585525513e-06, 8.931383490562439e-07, 4.202127456665039e-06, 7.511116564273834e-06, 1.082010567188263e-05, 1.4129094779491425e-05, 1.743808388710022e-05, 2.0747072994709015e-05, 2.405606210231781e-05, 2.7365051209926605e-05, 3.06740403175354e-05, 3.3983029425144196e-05, 3.729201853275299e-05, 4.0601007640361786e-05, 4.390999674797058e-05, 4.7218985855579376e-05, 5.052797496318817e-05, 5.3836964070796967e-05, 5.714595317840576e-05, 6.045494228601456e-05, 6.376393139362335e-05, 6.707292050123215e-05, 7.038190960884094e-05, 7.369089871644974e-05, 7.699988782405853e-05, 8.030887693166733e-05, 8.361786603927612e-05, 8.692685514688492e-05, 9.023584425449371e-05, 9.354483336210251e-05, 9.68538224697113e-05, 0.0001001628115773201, 0.0001034718006849289, 0.00010678078979253769, 0.00011008977890014648]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 4.0, 6.0, 4.0, 4.0, 9.0, 9.0, 16.0, 14.0, 31.0, 49.0, 92.0, 137.0, 252.0, 498.0, 1421.0, 7543.0, 136228.0, 872829.0, 24645.0, 3066.0, 828.0, 396.0, 184.0, 110.0, 69.0, 44.0, 27.0, 20.0, 7.0, 3.0, 9.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0121307373046875, -0.011609077453613281, -0.011087417602539062, -0.010565757751464844, -0.010044097900390625, -0.009522438049316406, -0.009000778198242188, -0.008479118347167969, -0.00795745849609375, -0.007435798645019531, -0.0069141387939453125, -0.006392478942871094, -0.005870819091796875, -0.005349159240722656, -0.0048274993896484375, -0.004305839538574219, -0.0037841796875, -0.0032625198364257812, -0.0027408599853515625, -0.0022192001342773438, -0.001697540283203125, -0.0011758804321289062, -0.0006542205810546875, -0.00013256072998046875, 0.00038909912109375, 0.0009107589721679688, 0.0014324188232421875, 0.0019540786743164062, 0.002475738525390625, 0.0029973983764648438, 0.0035190582275390625, 0.004040718078613281, 0.0045623779296875, 0.005084037780761719, 0.0056056976318359375, 0.006127357482910156, 0.006649017333984375, 0.007170677185058594, 0.0076923370361328125, 0.008213996887207031, 0.00873565673828125, 0.009257316589355469, 0.009778976440429688, 0.010300636291503906, 0.010822296142578125, 0.011343955993652344, 0.011865615844726562, 0.012387275695800781, 0.012908935546875, 0.013430595397949219, 0.013952255249023438, 0.014473915100097656, 0.014995574951171875, 0.015517234802246094, 0.016038894653320312, 0.01656055450439453, 0.01708221435546875, 0.01760387420654297, 0.018125534057617188, 0.018647193908691406, 0.019168853759765625, 0.019690513610839844, 0.020212173461914062, 0.02073383331298828, 0.0212554931640625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 7.0, 9.0, 12.0, 11.0, 14.0, 24.0, 37.0, 43.0, 55.0, 73.0, 102.0, 162.0, 159.0, 72.0, 53.0, 41.0, 30.0, 15.0, 13.0, 12.0, 5.0, 8.0, 8.0, 9.0, 5.0, 2.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.006778717041015625, -0.006611347198486328, -0.006443977355957031, -0.006276607513427734, -0.0061092376708984375, -0.005941867828369141, -0.005774497985839844, -0.005607128143310547, -0.00543975830078125, -0.005272388458251953, -0.005105018615722656, -0.004937648773193359, -0.0047702789306640625, -0.004602909088134766, -0.004435539245605469, -0.004268169403076172, -0.004100799560546875, -0.003933429718017578, -0.0037660598754882812, -0.0035986900329589844, -0.0034313201904296875, -0.0032639503479003906, -0.0030965805053710938, -0.002929210662841797, -0.0027618408203125, -0.002594470977783203, -0.0024271011352539062, -0.0022597312927246094, -0.0020923614501953125, -0.0019249916076660156, -0.0017576217651367188, -0.0015902519226074219, -0.001422882080078125, -0.0012555122375488281, -0.0010881423950195312, -0.0009207725524902344, -0.0007534027099609375, -0.0005860328674316406, -0.00041866302490234375, -0.0002512931823730469, -8.392333984375e-05, 8.344650268554688e-05, 0.00025081634521484375, 0.0004181861877441406, 0.0005855560302734375, 0.0007529258728027344, 0.0009202957153320312, 0.0010876655578613281, 0.001255035400390625, 0.0014224052429199219, 0.0015897750854492188, 0.0017571449279785156, 0.0019245147705078125, 0.0020918846130371094, 0.0022592544555664062, 0.002426624298095703, 0.002593994140625, 0.002761363983154297, 0.0029287338256835938, 0.0030961036682128906, 0.0032634735107421875, 0.0034308433532714844, 0.0035982131958007812, 0.003765583038330078, 0.003932952880859375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 94.0, 615.0, 261.0, 27.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20587629079818726, -0.19957023859024048, -0.1932641863822937, -0.18695813417434692, -0.18065208196640015, -0.17434602975845337, -0.1680399775505066, -0.16173392534255981, -0.15542787313461304, -0.14912182092666626, -0.14281576871871948, -0.1365097165107727, -0.13020366430282593, -0.12389761209487915, -0.11759155988693237, -0.1112855076789856, -0.10497944802045822, -0.09867339581251144, -0.09236734360456467, -0.08606129139661789, -0.07975523918867111, -0.07344917953014374, -0.06714312732219696, -0.06083707883954048, -0.054531026631593704, -0.04822497442364693, -0.04191892221570015, -0.035612866282463074, -0.029306815937161446, -0.02300076186656952, -0.01669470965862274, -0.010388657450675964, -0.004082605242729187, 0.0022234474308788776, 0.008529500104486942, 0.014835553243756294, 0.02114160545170307, 0.027447659522294998, 0.033753711730241776, 0.04005976393818855, 0.04636581614613533, 0.05267186835408211, 0.058977920562028885, 0.06528397649526596, 0.07159002870321274, 0.07789608091115952, 0.08420213311910629, 0.09050818532705307, 0.09681423753499985, 0.10312028974294662, 0.1094263419508934, 0.11573239415884018, 0.12203844636678696, 0.12834450602531433, 0.1346505582332611, 0.14095661044120789, 0.14726266264915466, 0.15356871485710144, 0.15987476706504822, 0.166180819272995, 0.17248687148094177, 0.17879292368888855, 0.18509897589683533, 0.1914050281047821, 0.19771108031272888]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 6.0, 7.0, 8.0, 7.0, 16.0, 16.0, 20.0, 22.0, 33.0, 32.0, 35.0, 45.0, 45.0, 52.0, 49.0, 56.0, 63.0, 57.0, 62.0, 51.0, 59.0, 43.0, 35.0, 31.0, 33.0, 35.0, 24.0, 16.0, 13.0, 9.0, 8.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03747594356536865, -0.03637423366308212, -0.03527252376079559, -0.034170813858509064, -0.033069103956222534, -0.031967394053936005, -0.030865684151649475, -0.029763974249362946, -0.028662264347076416, -0.027560554444789886, -0.026458844542503357, -0.025357134640216827, -0.024255424737930298, -0.02315371483564377, -0.02205200493335724, -0.02095029503107071, -0.01984858512878418, -0.01874687522649765, -0.01764516532421112, -0.01654345542192459, -0.015441745519638062, -0.014340035617351532, -0.013238325715065002, -0.012136615812778473, -0.011034905910491943, -0.009933196008205414, -0.008831486105918884, -0.007729776203632355, -0.006628066301345825, -0.005526356399059296, -0.004424646496772766, -0.0033229365944862366, -0.002221226692199707, -0.0011195167899131775, -1.780688762664795e-05, 0.0010839030146598816, 0.002185612916946411, 0.0032873228192329407, 0.00438903272151947, 0.005490742623806, 0.006592452526092529, 0.007694162428379059, 0.008795872330665588, 0.009897582232952118, 0.010999292135238647, 0.012101002037525177, 0.013202711939811707, 0.014304421842098236, 0.015406131744384766, 0.016507841646671295, 0.017609551548957825, 0.018711261451244354, 0.019812971353530884, 0.020914681255817413, 0.022016391158103943, 0.023118101060390472, 0.024219810962677002, 0.02532152086496353, 0.02642323076725006, 0.02752494066953659, 0.02862665057182312, 0.02972836047410965, 0.03083007037639618, 0.03193178027868271, 0.03303349018096924]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 5.0, 5.0, 10.0, 13.0, 18.0, 31.0, 32.0, 42.0, 71.0, 80.0, 126.0, 175.0, 297.0, 524.0, 1241.0, 12779.0, 4102308.0, 70833.0, 3822.0, 1252.0, 287.0, 137.0, 91.0, 45.0, 19.0, 15.0, 6.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.047576904296875, -0.046244144439697266, -0.04491138458251953, -0.0435786247253418, -0.04224586486816406, -0.04091310501098633, -0.039580345153808594, -0.03824758529663086, -0.036914825439453125, -0.03558206558227539, -0.034249305725097656, -0.03291654586791992, -0.03158378601074219, -0.030251026153564453, -0.02891826629638672, -0.027585506439208984, -0.02625274658203125, -0.024919986724853516, -0.02358722686767578, -0.022254467010498047, -0.020921707153320312, -0.019588947296142578, -0.018256187438964844, -0.01692342758178711, -0.015590667724609375, -0.01425790786743164, -0.012925148010253906, -0.011592388153076172, -0.010259628295898438, -0.008926868438720703, -0.007594108581542969, -0.006261348724365234, -0.0049285888671875, -0.0035958290100097656, -0.0022630691528320312, -0.0009303092956542969, 0.0004024505615234375, 0.0017352104187011719, 0.0030679702758789062, 0.004400730133056641, 0.005733489990234375, 0.007066249847412109, 0.008399009704589844, 0.009731769561767578, 0.011064529418945312, 0.012397289276123047, 0.013730049133300781, 0.015062808990478516, 0.01639556884765625, 0.017728328704833984, 0.01906108856201172, 0.020393848419189453, 0.021726608276367188, 0.023059368133544922, 0.024392127990722656, 0.02572488784790039, 0.027057647705078125, 0.02839040756225586, 0.029723167419433594, 0.031055927276611328, 0.03238868713378906, 0.0337214469909668, 0.03505420684814453, 0.036386966705322266, 0.0377197265625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 11.0, 50.0, 147.0, 317.0, 324.0, 118.0, 32.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0227508544921875, -0.022220373153686523, -0.021689891815185547, -0.02115941047668457, -0.020628929138183594, -0.020098447799682617, -0.01956796646118164, -0.019037485122680664, -0.018507003784179688, -0.01797652244567871, -0.017446041107177734, -0.016915559768676758, -0.01638507843017578, -0.015854597091674805, -0.015324115753173828, -0.014793634414672852, -0.014263153076171875, -0.013732671737670898, -0.013202190399169922, -0.012671709060668945, -0.012141227722167969, -0.011610746383666992, -0.011080265045166016, -0.010549783706665039, -0.010019302368164062, -0.009488821029663086, -0.00895833969116211, -0.008427858352661133, -0.007897377014160156, -0.00736689567565918, -0.006836414337158203, -0.0063059329986572266, -0.00577545166015625, -0.0052449703216552734, -0.004714488983154297, -0.00418400764465332, -0.0036535263061523438, -0.003123044967651367, -0.0025925636291503906, -0.002062082290649414, -0.0015316009521484375, -0.001001119613647461, -0.0004706382751464844, 5.984306335449219e-05, 0.0005903244018554688, 0.0011208057403564453, 0.0016512870788574219, 0.0021817684173583984, 0.002712249755859375, 0.0032427310943603516, 0.003773212432861328, 0.004303693771362305, 0.004834175109863281, 0.005364656448364258, 0.005895137786865234, 0.006425619125366211, 0.0069561004638671875, 0.007486581802368164, 0.00801706314086914, 0.008547544479370117, 0.009078025817871094, 0.00960850715637207, 0.010138988494873047, 0.010669469833374023, 0.011199951171875]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 7.0, 11.0, 14.0, 10.0, 22.0, 26.0, 53.0, 68.0, 91.0, 191.0, 345.0, 940.0, 4280.0, 247951.0, 3923341.0, 14102.0, 1712.0, 573.0, 237.0, 101.0, 53.0, 51.0, 29.0, 21.0, 16.0, 11.0, 14.0, 7.0, 4.0, 2.0, 2.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03875732421875, -0.037769317626953125, -0.03678131103515625, -0.035793304443359375, -0.0348052978515625, -0.033817291259765625, -0.03282928466796875, -0.031841278076171875, -0.030853271484375, -0.029865264892578125, -0.02887725830078125, -0.027889251708984375, -0.0269012451171875, -0.025913238525390625, -0.02492523193359375, -0.023937225341796875, -0.02294921875, -0.021961212158203125, -0.02097320556640625, -0.019985198974609375, -0.0189971923828125, -0.018009185791015625, -0.01702117919921875, -0.016033172607421875, -0.015045166015625, -0.014057159423828125, -0.01306915283203125, -0.012081146240234375, -0.0110931396484375, -0.010105133056640625, -0.00911712646484375, -0.008129119873046875, -0.00714111328125, -0.006153106689453125, -0.00516510009765625, -0.004177093505859375, -0.0031890869140625, -0.002201080322265625, -0.00121307373046875, -0.000225067138671875, 0.000762939453125, 0.001750946044921875, 0.00273895263671875, 0.003726959228515625, 0.0047149658203125, 0.005702972412109375, 0.00669097900390625, 0.007678985595703125, 0.0086669921875, 0.009654998779296875, 0.01064300537109375, 0.011631011962890625, 0.0126190185546875, 0.013607025146484375, 0.01459503173828125, 0.015583038330078125, 0.016571044921875, 0.017559051513671875, 0.01854705810546875, 0.019535064697265625, 0.0205230712890625, 0.021511077880859375, 0.02249908447265625, 0.023487091064453125, 0.02447509765625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 6.0, 5.0, 9.0, 16.0, 17.0, 22.0, 40.0, 61.0, 84.0, 162.0, 263.0, 445.0, 808.0, 808.0, 521.0, 269.0, 192.0, 125.0, 70.0, 57.0, 40.0, 19.0, 14.0, 10.0, 11.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0078125, -0.007512688636779785, -0.00721287727355957, -0.0069130659103393555, -0.006613254547119141, -0.006313443183898926, -0.006013631820678711, -0.005713820457458496, -0.005414009094238281, -0.005114197731018066, -0.0048143863677978516, -0.004514575004577637, -0.004214763641357422, -0.003914952278137207, -0.003615140914916992, -0.0033153295516967773, -0.0030155181884765625, -0.0027157068252563477, -0.002415895462036133, -0.002116084098815918, -0.0018162727355957031, -0.0015164613723754883, -0.0012166500091552734, -0.0009168386459350586, -0.0006170272827148438, -0.0003172159194946289, -1.7404556274414062e-05, 0.0002824068069458008, 0.0005822181701660156, 0.0008820295333862305, 0.0011818408966064453, 0.0014816522598266602, 0.001781463623046875, 0.00208127498626709, 0.0023810863494873047, 0.0026808977127075195, 0.0029807090759277344, 0.0032805204391479492, 0.003580331802368164, 0.003880143165588379, 0.004179954528808594, 0.004479765892028809, 0.0047795772552490234, 0.005079388618469238, 0.005379199981689453, 0.005679011344909668, 0.005978822708129883, 0.006278634071350098, 0.0065784454345703125, 0.006878256797790527, 0.007178068161010742, 0.007477879524230957, 0.007777690887451172, 0.008077502250671387, 0.008377313613891602, 0.008677124977111816, 0.008976936340332031, 0.009276747703552246, 0.009576559066772461, 0.009876370429992676, 0.01017618179321289, 0.010475993156433105, 0.01077580451965332, 0.011075615882873535, 0.01137542724609375]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 10.0, 53.0, 158.0, 310.0, 295.0, 112.0, 42.0, 13.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06732212007045746, -0.06505747884511948, -0.06279284507036209, -0.06052820384502411, -0.05826356261968613, -0.05599892511963844, -0.05373428761959076, -0.05146964639425278, -0.04920500889420509, -0.04694037139415741, -0.04467573016881943, -0.042411092668771744, -0.04014645516872406, -0.03788181394338608, -0.035617176443338394, -0.03335253894329071, -0.03108789771795273, -0.028823258355259895, -0.026558618992567062, -0.02429398149251938, -0.022029342129826546, -0.019764702767133713, -0.01750006526708603, -0.015235425904393196, -0.012970786541700363, -0.01070614717900753, -0.008441508747637272, -0.006176869850605726, -0.003912230953574181, -0.0016475915908813477, 0.0006170468404889107, 0.002881685271859169, 0.005146324634552002, 0.007410963531583548, 0.009675602428615093, 0.011940240859985352, 0.014204880222678185, 0.016469519585371017, 0.0187341570854187, 0.020998796448111534, 0.023263435810804367, 0.0255280751734972, 0.027792714536190033, 0.030057352036237717, 0.0323219895362854, 0.03458663076162338, 0.036851268261671066, 0.03911590576171875, 0.04138054698705673, 0.043645184487104416, 0.0459098257124424, 0.04817446321249008, 0.050439104437828064, 0.05270374193787575, 0.05496837943792343, 0.057233020663261414, 0.0594976581633091, 0.06176229566335678, 0.06402693688869476, 0.06629157811403275, 0.06855621188879013, 0.07082085311412811, 0.0730854943394661, 0.07535012811422348, 0.07761476933956146]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 6.0, 6.0, 12.0, 15.0, 16.0, 23.0, 23.0, 28.0, 42.0, 49.0, 56.0, 52.0, 62.0, 57.0, 65.0, 64.0, 66.0, 57.0, 56.0, 43.0, 50.0, 35.0, 28.0, 26.0, 14.0, 12.0, 7.0, 9.0, 9.0, 3.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.03581881523132324, -0.03491415083408356, -0.03400948643684387, -0.03310482203960419, -0.0322001576423645, -0.03129549324512482, -0.030390828847885132, -0.029486164450645447, -0.02858150005340576, -0.027676835656166077, -0.02677217125892639, -0.025867506861686707, -0.02496284246444702, -0.024058178067207336, -0.02315351366996765, -0.022248849272727966, -0.02134418487548828, -0.020439520478248596, -0.01953485608100891, -0.018630191683769226, -0.01772552728652954, -0.016820862889289856, -0.01591619849205017, -0.015011534094810486, -0.0141068696975708, -0.013202205300331116, -0.01229754090309143, -0.011392876505851746, -0.01048821210861206, -0.009583547711372375, -0.00867888331413269, -0.007774218916893005, -0.00686955451965332, -0.005964890122413635, -0.00506022572517395, -0.004155561327934265, -0.00325089693069458, -0.002346232533454895, -0.00144156813621521, -0.0005369037389755249, 0.00036776065826416016, 0.0012724250555038452, 0.0021770894527435303, 0.0030817538499832153, 0.0039864182472229, 0.0048910826444625854, 0.0057957470417022705, 0.006700411438941956, 0.007605075836181641, 0.008509740233421326, 0.00941440463066101, 0.010319069027900696, 0.01122373342514038, 0.012128397822380066, 0.013033062219619751, 0.013937726616859436, 0.014842391014099121, 0.015747055411338806, 0.01665171980857849, 0.017556384205818176, 0.01846104860305786, 0.019365713000297546, 0.02027037739753723, 0.021175041794776917, 0.0220797061920166]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 8.0, 6.0, 15.0, 10.0, 14.0, 13.0, 25.0, 27.0, 29.0, 58.0, 79.0, 100.0, 152.0, 199.0, 324.0, 552.0, 1045.0, 3581.0, 92436.0, 917980.0, 27342.0, 2198.0, 853.0, 449.0, 357.0, 218.0, 147.0, 83.0, 75.0, 43.0, 31.0, 18.0, 25.0, 15.0, 12.0, 9.0, 5.0, 7.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.032196044921875, -0.031169414520263672, -0.030142784118652344, -0.029116153717041016, -0.028089523315429688, -0.02706289291381836, -0.02603626251220703, -0.025009632110595703, -0.023983001708984375, -0.022956371307373047, -0.02192974090576172, -0.02090311050415039, -0.019876480102539062, -0.018849849700927734, -0.017823219299316406, -0.016796588897705078, -0.01576995849609375, -0.014743328094482422, -0.013716697692871094, -0.012690067291259766, -0.011663436889648438, -0.01063680648803711, -0.009610176086425781, -0.008583545684814453, -0.007556915283203125, -0.006530284881591797, -0.005503654479980469, -0.004477024078369141, -0.0034503936767578125, -0.0024237632751464844, -0.0013971328735351562, -0.0003705024719238281, 0.0006561279296875, 0.0016827583312988281, 0.0027093887329101562, 0.0037360191345214844, 0.0047626495361328125, 0.005789279937744141, 0.006815910339355469, 0.007842540740966797, 0.008869171142578125, 0.009895801544189453, 0.010922431945800781, 0.01194906234741211, 0.012975692749023438, 0.014002323150634766, 0.015028953552246094, 0.016055583953857422, 0.01708221435546875, 0.018108844757080078, 0.019135475158691406, 0.020162105560302734, 0.021188735961914062, 0.02221536636352539, 0.02324199676513672, 0.024268627166748047, 0.025295257568359375, 0.026321887969970703, 0.02734851837158203, 0.02837514877319336, 0.029401779174804688, 0.030428409576416016, 0.031455039978027344, 0.03248167037963867, 0.03350830078125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 11.0, 75.0, 194.0, 387.0, 230.0, 82.0, 24.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0218048095703125, -0.021292686462402344, -0.020780563354492188, -0.02026844024658203, -0.019756317138671875, -0.01924419403076172, -0.018732070922851562, -0.018219947814941406, -0.01770782470703125, -0.017195701599121094, -0.016683578491210938, -0.01617145538330078, -0.015659332275390625, -0.015147209167480469, -0.014635086059570312, -0.014122962951660156, -0.01361083984375, -0.013098716735839844, -0.012586593627929688, -0.012074470520019531, -0.011562347412109375, -0.011050224304199219, -0.010538101196289062, -0.010025978088378906, -0.00951385498046875, -0.009001731872558594, -0.008489608764648438, -0.007977485656738281, -0.007465362548828125, -0.006953239440917969, -0.0064411163330078125, -0.005928993225097656, -0.0054168701171875, -0.004904747009277344, -0.0043926239013671875, -0.0038805007934570312, -0.003368377685546875, -0.0028562545776367188, -0.0023441314697265625, -0.0018320083618164062, -0.00131988525390625, -0.0008077621459960938, -0.0002956390380859375, 0.00021648406982421875, 0.000728607177734375, 0.0012407302856445312, 0.0017528533935546875, 0.0022649765014648438, 0.002777099609375, 0.0032892227172851562, 0.0038013458251953125, 0.004313468933105469, 0.004825592041015625, 0.005337715148925781, 0.0058498382568359375, 0.006361961364746094, 0.00687408447265625, 0.007386207580566406, 0.007898330688476562, 0.008410453796386719, 0.008922576904296875, 0.009434700012207031, 0.009946823120117188, 0.010458946228027344, 0.0109710693359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 12.0, 10.0, 17.0, 20.0, 19.0, 24.0, 38.0, 43.0, 55.0, 73.0, 99.0, 123.0, 163.0, 251.0, 409.0, 650.0, 1222.0, 3066.0, 11518.0, 61881.0, 354130.0, 485297.0, 103628.0, 17891.0, 4151.0, 1486.0, 766.0, 445.0, 297.0, 175.0, 158.0, 93.0, 67.0, 62.0, 63.0, 25.0, 34.0, 22.0, 12.0, 11.0, 13.0, 9.0, 9.0, 6.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0109100341796875, -0.010559678077697754, -0.010209321975708008, -0.009858965873718262, -0.009508609771728516, -0.00915825366973877, -0.008807897567749023, -0.008457541465759277, -0.008107185363769531, -0.007756829261779785, -0.007406473159790039, -0.007056117057800293, -0.006705760955810547, -0.006355404853820801, -0.006005048751831055, -0.005654692649841309, -0.0053043365478515625, -0.004953980445861816, -0.00460362434387207, -0.004253268241882324, -0.003902912139892578, -0.003552556037902832, -0.003202199935913086, -0.00285184383392334, -0.0025014877319335938, -0.0021511316299438477, -0.0018007755279541016, -0.0014504194259643555, -0.0011000633239746094, -0.0007497072219848633, -0.0003993511199951172, -4.8995018005371094e-05, 0.000301361083984375, 0.0006517171859741211, 0.0010020732879638672, 0.0013524293899536133, 0.0017027854919433594, 0.0020531415939331055, 0.0024034976959228516, 0.0027538537979125977, 0.0031042098999023438, 0.00345456600189209, 0.003804922103881836, 0.004155278205871582, 0.004505634307861328, 0.004855990409851074, 0.00520634651184082, 0.005556702613830566, 0.0059070587158203125, 0.006257414817810059, 0.006607770919799805, 0.006958127021789551, 0.007308483123779297, 0.007658839225769043, 0.008009195327758789, 0.008359551429748535, 0.008709907531738281, 0.009060263633728027, 0.009410619735717773, 0.00976097583770752, 0.010111331939697266, 0.010461688041687012, 0.010812044143676758, 0.011162400245666504, 0.01151275634765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 5.0, 5.0, 4.0, 4.0, 7.0, 5.0, 13.0, 16.0, 20.0, 24.0, 21.0, 25.0, 26.0, 32.0, 26.0, 45.0, 48.0, 37.0, 31.0, 44.0, 44.0, 42.0, 47.0, 39.0, 44.0, 39.0, 38.0, 31.0, 38.0, 32.0, 26.0, 17.0, 32.0, 17.0, 16.0, 9.0, 9.0, 13.0, 9.0, 7.0, 11.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007476806640625, -0.007230281829833984, -0.006983757019042969, -0.006737232208251953, -0.0064907073974609375, -0.006244182586669922, -0.005997657775878906, -0.005751132965087891, -0.005504608154296875, -0.005258083343505859, -0.005011558532714844, -0.004765033721923828, -0.0045185089111328125, -0.004271984100341797, -0.004025459289550781, -0.0037789344787597656, -0.00353240966796875, -0.0032858848571777344, -0.0030393600463867188, -0.002792835235595703, -0.0025463104248046875, -0.002299785614013672, -0.0020532608032226562, -0.0018067359924316406, -0.001560211181640625, -0.0013136863708496094, -0.0010671615600585938, -0.0008206367492675781, -0.0005741119384765625, -0.0003275871276855469, -8.106231689453125e-05, 0.00016546249389648438, 0.0004119873046875, 0.0006585121154785156, 0.0009050369262695312, 0.0011515617370605469, 0.0013980865478515625, 0.0016446113586425781, 0.0018911361694335938, 0.0021376609802246094, 0.002384185791015625, 0.0026307106018066406, 0.0028772354125976562, 0.003123760223388672, 0.0033702850341796875, 0.003616809844970703, 0.0038633346557617188, 0.004109859466552734, 0.00435638427734375, 0.004602909088134766, 0.004849433898925781, 0.005095958709716797, 0.0053424835205078125, 0.005589008331298828, 0.005835533142089844, 0.006082057952880859, 0.006328582763671875, 0.006575107574462891, 0.006821632385253906, 0.007068157196044922, 0.0073146820068359375, 0.007561206817626953, 0.007807731628417969, 0.008054256439208984, 0.00830078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 9.0, 5.0, 5.0, 11.0, 14.0, 28.0, 40.0, 68.0, 135.0, 234.0, 430.0, 948.0, 1932.0, 4503.0, 12182.0, 56099.0, 518248.0, 392781.0, 43073.0, 10498.0, 3848.0, 1682.0, 820.0, 410.0, 205.0, 134.0, 69.0, 44.0, 34.0, 17.0, 15.0, 11.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0052490234375, -0.005084633827209473, -0.004920244216918945, -0.004755854606628418, -0.004591464996337891, -0.004427075386047363, -0.004262685775756836, -0.004098296165466309, -0.003933906555175781, -0.003769516944885254, -0.0036051273345947266, -0.0034407377243041992, -0.003276348114013672, -0.0031119585037231445, -0.002947568893432617, -0.00278317928314209, -0.0026187896728515625, -0.002454400062561035, -0.002290010452270508, -0.0021256208419799805, -0.001961231231689453, -0.0017968416213989258, -0.0016324520111083984, -0.001468062400817871, -0.0013036727905273438, -0.0011392831802368164, -0.0009748935699462891, -0.0008105039596557617, -0.0006461143493652344, -0.00048172473907470703, -0.0003173351287841797, -0.00015294551849365234, 1.1444091796875e-05, 0.00017583370208740234, 0.0003402233123779297, 0.000504612922668457, 0.0006690025329589844, 0.0008333921432495117, 0.000997781753540039, 0.0011621713638305664, 0.0013265609741210938, 0.001490950584411621, 0.0016553401947021484, 0.0018197298049926758, 0.001984119415283203, 0.0021485090255737305, 0.002312898635864258, 0.002477288246154785, 0.0026416778564453125, 0.00280606746673584, 0.002970457077026367, 0.0031348466873168945, 0.003299236297607422, 0.0034636259078979492, 0.0036280155181884766, 0.003792405128479004, 0.003956794738769531, 0.004121184349060059, 0.004285573959350586, 0.004449963569641113, 0.004614353179931641, 0.004778742790222168, 0.004943132400512695, 0.005107522010803223, 0.00527191162109375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 6.0, 2.0, 6.0, 13.0, 8.0, 18.0, 27.0, 33.0, 49.0, 60.0, 95.0, 136.0, 151.0, 112.0, 92.0, 62.0, 36.0, 28.0, 23.0, 15.0, 11.0, 11.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001646280288696289, -0.00016083288937807083, -0.00015703774988651276, -0.00015324261039495468, -0.0001494474709033966, -0.00014565233141183853, -0.00014185719192028046, -0.00013806205242872238, -0.0001342669129371643, -0.00013047177344560623, -0.00012667663395404816, -0.00012288149446249008, -0.00011908635497093201, -0.00011529121547937393, -0.00011149607598781586, -0.00010770093649625778, -0.00010390579700469971, -0.00010011065751314163, -9.631551802158356e-05, -9.252037853002548e-05, -8.872523903846741e-05, -8.493009954690933e-05, -8.113496005535126e-05, -7.733982056379318e-05, -7.354468107223511e-05, -6.974954158067703e-05, -6.595440208911896e-05, -6.215926259756088e-05, -5.836412310600281e-05, -5.456898361444473e-05, -5.077384412288666e-05, -4.697870463132858e-05, -4.318356513977051e-05, -3.938842564821243e-05, -3.559328615665436e-05, -3.179814666509628e-05, -2.8003007173538208e-05, -2.4207867681980133e-05, -2.0412728190422058e-05, -1.6617588698863983e-05, -1.2822449207305908e-05, -9.027309715747833e-06, -5.232170224189758e-06, -1.4370307326316833e-06, 2.3581087589263916e-06, 6.1532482504844666e-06, 9.948387742042542e-06, 1.3743527233600616e-05, 1.753866672515869e-05, 2.1333806216716766e-05, 2.512894570827484e-05, 2.8924085199832916e-05, 3.271922469139099e-05, 3.6514364182949066e-05, 4.030950367450714e-05, 4.4104643166065216e-05, 4.789978265762329e-05, 5.1694922149181366e-05, 5.549006164073944e-05, 5.9285201132297516e-05, 6.308034062385559e-05, 6.687548011541367e-05, 7.067061960697174e-05, 7.446575909852982e-05, 7.826089859008789e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 7.0, 8.0, 13.0, 14.0, 23.0, 38.0, 40.0, 68.0, 140.0, 320.0, 682.0, 2003.0, 8007.0, 84149.0, 879788.0, 63131.0, 6964.0, 1808.0, 671.0, 276.0, 162.0, 84.0, 46.0, 31.0, 27.0, 14.0, 5.0, 5.0, 7.0, 3.0, 3.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01100921630859375, -0.010722935199737549, -0.010436654090881348, -0.010150372982025146, -0.009864091873168945, -0.009577810764312744, -0.009291529655456543, -0.009005248546600342, -0.00871896743774414, -0.00843268632888794, -0.008146405220031738, -0.007860124111175537, -0.007573843002319336, -0.007287561893463135, -0.007001280784606934, -0.006714999675750732, -0.006428718566894531, -0.00614243745803833, -0.005856156349182129, -0.005569875240325928, -0.0052835941314697266, -0.004997313022613525, -0.004711031913757324, -0.004424750804901123, -0.004138469696044922, -0.0038521885871887207, -0.0035659074783325195, -0.0032796263694763184, -0.002993345260620117, -0.002707064151763916, -0.002420783042907715, -0.0021345019340515137, -0.0018482208251953125, -0.0015619397163391113, -0.0012756586074829102, -0.000989377498626709, -0.0007030963897705078, -0.00041681528091430664, -0.00013053417205810547, 0.0001557469367980957, 0.0004420280456542969, 0.000728309154510498, 0.0010145902633666992, 0.0013008713722229004, 0.0015871524810791016, 0.0018734335899353027, 0.002159714698791504, 0.002445995807647705, 0.0027322769165039062, 0.0030185580253601074, 0.0033048391342163086, 0.0035911202430725098, 0.003877401351928711, 0.004163682460784912, 0.004449963569641113, 0.0047362446784973145, 0.005022525787353516, 0.005308806896209717, 0.005595088005065918, 0.005881369113922119, 0.00616765022277832, 0.0064539313316345215, 0.006740212440490723, 0.007026493549346924, 0.007312774658203125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 4.0, 4.0, 2.0, 4.0, 5.0, 12.0, 6.0, 14.0, 22.0, 26.0, 40.0, 53.0, 79.0, 89.0, 113.0, 116.0, 89.0, 85.0, 71.0, 63.0, 31.0, 26.0, 15.0, 9.0, 2.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004467010498046875, -0.004340678453445435, -0.004214346408843994, -0.004088014364242554, -0.003961682319641113, -0.003835350275039673, -0.0037090182304382324, -0.003582686185836792, -0.0034563541412353516, -0.003330022096633911, -0.0032036900520324707, -0.0030773580074310303, -0.00295102596282959, -0.0028246939182281494, -0.002698361873626709, -0.0025720298290252686, -0.002445697784423828, -0.0023193657398223877, -0.0021930336952209473, -0.002066701650619507, -0.0019403696060180664, -0.001814037561416626, -0.0016877055168151855, -0.0015613734722137451, -0.0014350414276123047, -0.0013087093830108643, -0.0011823773384094238, -0.0010560452938079834, -0.000929713249206543, -0.0008033812046051025, -0.0006770491600036621, -0.0005507171154022217, -0.00042438507080078125, -0.0002980530261993408, -0.0001717209815979004, -4.538893699645996e-05, 8.094310760498047e-05, 0.0002072751522064209, 0.00033360719680786133, 0.00045993924140930176, 0.0005862712860107422, 0.0007126033306121826, 0.000838935375213623, 0.0009652674198150635, 0.001091599464416504, 0.0012179315090179443, 0.0013442635536193848, 0.0014705955982208252, 0.0015969276428222656, 0.001723259687423706, 0.0018495917320251465, 0.001975923776626587, 0.0021022558212280273, 0.0022285878658294678, 0.002354919910430908, 0.0024812519550323486, 0.002607583999633789, 0.0027339160442352295, 0.00286024808883667, 0.0029865801334381104, 0.0031129121780395508, 0.003239244222640991, 0.0033655762672424316, 0.003491908311843872, 0.0036182403564453125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 7.0, 7.0, 39.0, 186.0, 475.0, 246.0, 38.0, 12.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15255309641361237, -0.14921241998672485, -0.14587172865867615, -0.14253105223178864, -0.13919036090373993, -0.13584968447685242, -0.1325089931488037, -0.1291683167219162, -0.1258276253938675, -0.12248694151639938, -0.11914625763893127, -0.11580557376146317, -0.11246488988399506, -0.10912420600652695, -0.10578352212905884, -0.10244284570217133, -0.09910216182470322, -0.09576147794723511, -0.092420794069767, -0.08908011019229889, -0.08573942631483078, -0.08239874243736267, -0.07905806601047516, -0.07571737468242645, -0.07237669825553894, -0.06903601437807083, -0.06569533050060272, -0.06235464662313461, -0.059013962745666504, -0.055673278868198395, -0.052332598716020584, -0.048991914838552475, -0.045651234686374664, -0.042310550808906555, -0.038969866931438446, -0.03562918305397034, -0.03228849917650223, -0.028947817161679268, -0.025607135146856308, -0.0222664512693882, -0.01892576739192009, -0.01558508351445198, -0.012244400568306446, -0.008903717622160912, -0.005563033744692802, -0.0022223498672246933, 0.0011183321475982666, 0.004459016025066376, 0.007799699902534485, 0.011140383780002594, 0.014481066726148129, 0.017821749672293663, 0.021162433549761772, 0.02450311742722988, 0.02784379944205284, 0.03118448331952095, 0.03452516719698906, 0.03786585107445717, 0.04120653495192528, 0.04454721510410309, 0.0478878989815712, 0.05122858285903931, 0.054569266736507416, 0.057909950613975525, 0.061250634491443634]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 4.0, 9.0, 11.0, 20.0, 26.0, 37.0, 38.0, 49.0, 52.0, 58.0, 70.0, 76.0, 77.0, 78.0, 67.0, 61.0, 33.0, 48.0, 38.0, 38.0, 22.0, 24.0, 15.0, 16.0, 13.0, 7.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03255683183670044, -0.031247559934854507, -0.029938289895653725, -0.028629019856452942, -0.02731974795460701, -0.026010476052761078, -0.024701206013560295, -0.023391935974359512, -0.02208266407251358, -0.02077339217066765, -0.019464122131466866, -0.018154852092266083, -0.01684558019042015, -0.015536309219896793, -0.014227038249373436, -0.012917767278850079, -0.011608496308326721, -0.010299225337803364, -0.008989954367280006, -0.007680683396756649, -0.006371412426233292, -0.005062141455709934, -0.003752870485186577, -0.0024435995146632195, -0.001134328544139862, 0.00017494242638349533, 0.0014842133969068527, 0.00279348436743021, 0.0041027553379535675, 0.005412026308476925, 0.006721297279000282, 0.00803056824952364, 0.009339839220046997, 0.010649110190570354, 0.011958381161093712, 0.01326765213161707, 0.014576923102140427, 0.01588619500398636, 0.01719546504318714, 0.018504735082387924, 0.019814006984233856, 0.021123278886079788, 0.02243254892528057, 0.023741818964481354, 0.025051090866327286, 0.026360362768173218, 0.027669632807374, 0.028978902846574783, 0.030288174748420715, 0.03159744665026665, 0.03290671855211258, 0.03421598672866821, 0.035525258630514145, 0.03683453053236008, 0.03814379870891571, 0.03945307061076164, 0.040762342512607574, 0.042071614414453506, 0.04338088631629944, 0.04469015449285507, 0.045999426394701004, 0.047308698296546936, 0.04861796647310257, 0.0499272383749485, 0.051236510276794434]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 10.0, 7.0, 11.0, 12.0, 13.0, 27.0, 29.0, 38.0, 49.0, 75.0, 124.0, 202.0, 292.0, 469.0, 957.0, 6804.0, 2161282.0, 2014043.0, 6473.0, 2355.0, 572.0, 170.0, 116.0, 53.0, 29.0, 20.0, 7.0, 12.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.04541015625, -0.04427480697631836, -0.04313945770263672, -0.04200410842895508, -0.04086875915527344, -0.0397334098815918, -0.038598060607910156, -0.037462711334228516, -0.036327362060546875, -0.035192012786865234, -0.034056663513183594, -0.03292131423950195, -0.03178596496582031, -0.030650615692138672, -0.02951526641845703, -0.02837991714477539, -0.02724456787109375, -0.02610921859741211, -0.02497386932373047, -0.023838520050048828, -0.022703170776367188, -0.021567821502685547, -0.020432472229003906, -0.019297122955322266, -0.018161773681640625, -0.017026424407958984, -0.015891075134277344, -0.014755725860595703, -0.013620376586914062, -0.012485027313232422, -0.011349678039550781, -0.01021432876586914, -0.0090789794921875, -0.00794363021850586, -0.006808280944824219, -0.005672931671142578, -0.0045375823974609375, -0.003402233123779297, -0.0022668838500976562, -0.0011315345764160156, 3.814697265625e-06, 0.0011391639709472656, 0.0022745132446289062, 0.003409862518310547, 0.0045452117919921875, 0.005680561065673828, 0.006815910339355469, 0.00795125961303711, 0.00908660888671875, 0.01022195816040039, 0.011357307434082031, 0.012492656707763672, 0.013628005981445312, 0.014763355255126953, 0.015898704528808594, 0.017034053802490234, 0.018169403076171875, 0.019304752349853516, 0.020440101623535156, 0.021575450897216797, 0.022710800170898438, 0.023846149444580078, 0.02498149871826172, 0.02611684799194336, 0.027252197265625]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 27.0, 100.0, 315.0, 356.0, 144.0, 51.0, 9.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0228271484375, -0.022298336029052734, -0.02176952362060547, -0.021240711212158203, -0.020711898803710938, -0.020183086395263672, -0.019654273986816406, -0.01912546157836914, -0.018596649169921875, -0.01806783676147461, -0.017539024353027344, -0.017010211944580078, -0.016481399536132812, -0.015952587127685547, -0.015423774719238281, -0.014894962310791016, -0.01436614990234375, -0.013837337493896484, -0.013308525085449219, -0.012779712677001953, -0.012250900268554688, -0.011722087860107422, -0.011193275451660156, -0.01066446304321289, -0.010135650634765625, -0.00960683822631836, -0.009078025817871094, -0.008549213409423828, -0.008020401000976562, -0.007491588592529297, -0.006962776184082031, -0.006433963775634766, -0.0059051513671875, -0.005376338958740234, -0.004847526550292969, -0.004318714141845703, -0.0037899017333984375, -0.003261089324951172, -0.0027322769165039062, -0.0022034645080566406, -0.001674652099609375, -0.0011458396911621094, -0.0006170272827148438, -8.821487426757812e-05, 0.0004405975341796875, 0.0009694099426269531, 0.0014982223510742188, 0.0020270347595214844, 0.00255584716796875, 0.0030846595764160156, 0.0036134719848632812, 0.004142284393310547, 0.0046710968017578125, 0.005199909210205078, 0.005728721618652344, 0.006257534027099609, 0.006786346435546875, 0.007315158843994141, 0.007843971252441406, 0.008372783660888672, 0.008901596069335938, 0.009430408477783203, 0.009959220886230469, 0.010488033294677734, 0.011016845703125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 10.0, 4.0, 13.0, 24.0, 29.0, 35.0, 67.0, 117.0, 224.0, 661.0, 2796.0, 103408.0, 4071135.0, 13384.0, 1450.0, 446.0, 200.0, 105.0, 64.0, 38.0, 16.0, 19.0, 6.0, 6.0, 7.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.037353515625, -0.03637838363647461, -0.03540325164794922, -0.03442811965942383, -0.03345298767089844, -0.03247785568237305, -0.031502723693847656, -0.030527591705322266, -0.029552459716796875, -0.028577327728271484, -0.027602195739746094, -0.026627063751220703, -0.025651931762695312, -0.024676799774169922, -0.02370166778564453, -0.02272653579711914, -0.02175140380859375, -0.02077627182006836, -0.01980113983154297, -0.018826007843017578, -0.017850875854492188, -0.016875743865966797, -0.015900611877441406, -0.014925479888916016, -0.013950347900390625, -0.012975215911865234, -0.012000083923339844, -0.011024951934814453, -0.010049819946289062, -0.009074687957763672, -0.008099555969238281, -0.007124423980712891, -0.0061492919921875, -0.005174160003662109, -0.004199028015136719, -0.003223896026611328, -0.0022487640380859375, -0.0012736320495605469, -0.00029850006103515625, 0.0006766319274902344, 0.001651763916015625, 0.0026268959045410156, 0.0036020278930664062, 0.004577159881591797, 0.0055522918701171875, 0.006527423858642578, 0.007502555847167969, 0.00847768783569336, 0.00945281982421875, 0.01042795181274414, 0.011403083801269531, 0.012378215789794922, 0.013353347778320312, 0.014328479766845703, 0.015303611755371094, 0.016278743743896484, 0.017253875732421875, 0.018229007720947266, 0.019204139709472656, 0.020179271697998047, 0.021154403686523438, 0.022129535675048828, 0.02310466766357422, 0.02407979965209961, 0.025054931640625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 3.0, 5.0, 6.0, 8.0, 19.0, 23.0, 39.0, 61.0, 105.0, 146.0, 240.0, 480.0, 844.0, 917.0, 454.0, 293.0, 145.0, 104.0, 64.0, 34.0, 27.0, 21.0, 18.0, 6.0, 2.0, 3.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00850677490234375, -0.00824117660522461, -0.007975578308105469, -0.007709980010986328, -0.0074443817138671875, -0.007178783416748047, -0.006913185119628906, -0.006647586822509766, -0.006381988525390625, -0.006116390228271484, -0.005850791931152344, -0.005585193634033203, -0.0053195953369140625, -0.005053997039794922, -0.004788398742675781, -0.004522800445556641, -0.0042572021484375, -0.003991603851318359, -0.0037260055541992188, -0.003460407257080078, -0.0031948089599609375, -0.002929210662841797, -0.0026636123657226562, -0.0023980140686035156, -0.002132415771484375, -0.0018668174743652344, -0.0016012191772460938, -0.0013356208801269531, -0.0010700225830078125, -0.0008044242858886719, -0.0005388259887695312, -0.0002732276916503906, -7.62939453125e-06, 0.0002579689025878906, 0.0005235671997070312, 0.0007891654968261719, 0.0010547637939453125, 0.0013203620910644531, 0.0015859603881835938, 0.0018515586853027344, 0.002117156982421875, 0.0023827552795410156, 0.0026483535766601562, 0.002913951873779297, 0.0031795501708984375, 0.003445148468017578, 0.0037107467651367188, 0.003976345062255859, 0.004241943359375, 0.004507541656494141, 0.004773139953613281, 0.005038738250732422, 0.0053043365478515625, 0.005569934844970703, 0.005835533142089844, 0.006101131439208984, 0.006366729736328125, 0.006632328033447266, 0.006897926330566406, 0.007163524627685547, 0.0074291229248046875, 0.007694721221923828, 0.007960319519042969, 0.00822591781616211, 0.00849151611328125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 10.0, 23.0, 138.0, 341.0, 339.0, 111.0, 29.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04533467814326286, -0.04292302951216698, -0.04051138088107109, -0.038099732249975204, -0.03568808734416962, -0.03327643871307373, -0.030864790081977844, -0.028453141450881958, -0.026041492819786072, -0.023629844188690186, -0.0212181955575943, -0.018806548789143562, -0.016394900158047676, -0.01398325152695179, -0.011571603827178478, -0.009159956127405167, -0.00674830749630928, -0.0043366593308746815, -0.0019250111654400826, 0.00048663699999451637, 0.0028982851654291153, 0.0053099337965250015, 0.007721581496298313, 0.010133229196071625, 0.012544877827167511, 0.014956526458263397, 0.017368175089359283, 0.01977982185781002, 0.022191470488905907, 0.024603119120001793, 0.02701476588845253, 0.029426414519548416, 0.0318380668759346, 0.03424971550703049, 0.03666136413812637, 0.03907301276922226, 0.041484661400318146, 0.04389631003141403, 0.04630795493721962, 0.048719603568315506, 0.05113125219941139, 0.05354290083050728, 0.055954549461603165, 0.05836619809269905, 0.06077784299850464, 0.06318949162960052, 0.06560114026069641, 0.0680127888917923, 0.07042443752288818, 0.07283608615398407, 0.07524773478507996, 0.07765938341617584, 0.08007103204727173, 0.08248268067836761, 0.0848943293094635, 0.08730597794055939, 0.08971762657165527, 0.09212927520275116, 0.09454092383384705, 0.09695257246494293, 0.09936422109603882, 0.1017758697271347, 0.10418751835823059, 0.10659916698932648, 0.10901080816984177]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 14.0, 8.0, 12.0, 18.0, 17.0, 28.0, 24.0, 32.0, 39.0, 46.0, 41.0, 51.0, 53.0, 62.0, 65.0, 53.0, 39.0, 58.0, 44.0, 56.0, 47.0, 36.0, 26.0, 21.0, 24.0, 24.0, 14.0, 13.0, 10.0, 8.0, 4.0, 6.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02054530382156372, -0.01976127177476883, -0.01897723786532879, -0.018193203955888748, -0.017409171909093857, -0.016625139862298965, -0.015841105952858925, -0.015057072974741459, -0.014273039996623993, -0.013489007018506527, -0.012704974040389061, -0.011920941062271595, -0.011136908084154129, -0.010352875106036663, -0.009568842127919197, -0.008784809149801731, -0.008000776171684265, -0.007216743193566799, -0.006432710215449333, -0.005648677237331867, -0.004864644259214401, -0.004080611281096935, -0.0032965783029794693, -0.0025125453248620033, -0.0017285123467445374, -0.0009444793686270714, -0.0001604463905096054, 0.0006235865876078606, 0.0014076195657253265, 0.0021916525438427925, 0.0029756855219602585, 0.0037597185000777245, 0.00454375147819519, 0.005327784456312656, 0.006111817434430122, 0.006895850412547588, 0.007679883390665054, 0.00846391636878252, 0.009247949346899986, 0.010031982325017452, 0.010816015303134918, 0.011600048281252384, 0.01238408125936985, 0.013168114237487316, 0.013952147215604782, 0.014736180193722248, 0.015520213171839714, 0.016304247081279755, 0.017088279128074646, 0.017872311174869537, 0.018656345084309578, 0.01944037899374962, 0.02022441104054451, 0.0210084430873394, 0.021792476996779442, 0.022576510906219482, 0.023360542953014374, 0.024144574999809265, 0.024928608909249306, 0.025712642818689346, 0.026496674865484238, 0.02728070691227913, 0.02806474082171917, 0.02884877473115921, 0.0296328067779541]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 8.0, 7.0, 7.0, 9.0, 19.0, 18.0, 28.0, 40.0, 46.0, 62.0, 88.0, 143.0, 222.0, 347.0, 594.0, 1253.0, 6530.0, 752581.0, 280190.0, 3875.0, 1010.0, 502.0, 309.0, 174.0, 153.0, 88.0, 65.0, 43.0, 28.0, 30.0, 27.0, 11.0, 11.0, 6.0, 4.0, 7.0, 8.0, 1.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.048492431640625, -0.04687023162841797, -0.04524803161621094, -0.043625831604003906, -0.042003631591796875, -0.040381431579589844, -0.03875923156738281, -0.03713703155517578, -0.03551483154296875, -0.03389263153076172, -0.03227043151855469, -0.030648231506347656, -0.029026031494140625, -0.027403831481933594, -0.025781631469726562, -0.02415943145751953, -0.0225372314453125, -0.02091503143310547, -0.019292831420898438, -0.017670631408691406, -0.016048431396484375, -0.014426231384277344, -0.012804031372070312, -0.011181831359863281, -0.00955963134765625, -0.007937431335449219, -0.0063152313232421875, -0.004693031311035156, -0.003070831298828125, -0.0014486312866210938, 0.0001735687255859375, 0.0017957687377929688, 0.00341796875, 0.005040168762207031, 0.0066623687744140625, 0.008284568786621094, 0.009906768798828125, 0.011528968811035156, 0.013151168823242188, 0.014773368835449219, 0.01639556884765625, 0.01801776885986328, 0.019639968872070312, 0.021262168884277344, 0.022884368896484375, 0.024506568908691406, 0.026128768920898438, 0.02775096893310547, 0.0293731689453125, 0.03099536895751953, 0.03261756896972656, 0.034239768981933594, 0.035861968994140625, 0.037484169006347656, 0.03910636901855469, 0.04072856903076172, 0.04235076904296875, 0.04397296905517578, 0.04559516906738281, 0.047217369079589844, 0.048839569091796875, 0.050461769104003906, 0.05208396911621094, 0.05370616912841797, 0.055328369140625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 8.0, 69.0, 230.0, 384.0, 233.0, 63.0, 15.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.022247314453125, -0.0217360258102417, -0.0212247371673584, -0.020713448524475098, -0.020202159881591797, -0.019690871238708496, -0.019179582595825195, -0.018668293952941895, -0.018157005310058594, -0.017645716667175293, -0.017134428024291992, -0.01662313938140869, -0.01611185073852539, -0.01560056209564209, -0.015089273452758789, -0.014577984809875488, -0.014066696166992188, -0.013555407524108887, -0.013044118881225586, -0.012532830238342285, -0.012021541595458984, -0.011510252952575684, -0.010998964309692383, -0.010487675666809082, -0.009976387023925781, -0.00946509838104248, -0.00895380973815918, -0.008442521095275879, -0.007931232452392578, -0.007419943809509277, -0.0069086551666259766, -0.006397366523742676, -0.005886077880859375, -0.005374789237976074, -0.0048635005950927734, -0.004352211952209473, -0.003840923309326172, -0.003329634666442871, -0.0028183460235595703, -0.0023070573806762695, -0.0017957687377929688, -0.001284480094909668, -0.0007731914520263672, -0.0002619028091430664, 0.0002493858337402344, 0.0007606744766235352, 0.001271963119506836, 0.0017832517623901367, 0.0022945404052734375, 0.0028058290481567383, 0.003317117691040039, 0.00382840633392334, 0.004339694976806641, 0.004850983619689941, 0.005362272262573242, 0.005873560905456543, 0.006384849548339844, 0.0068961381912231445, 0.007407426834106445, 0.007918715476989746, 0.008430004119873047, 0.008941292762756348, 0.009452581405639648, 0.00996387004852295, 0.01047515869140625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 3.0, 4.0, 6.0, 5.0, 10.0, 9.0, 13.0, 20.0, 27.0, 61.0, 59.0, 100.0, 156.0, 257.0, 391.0, 693.0, 1471.0, 4062.0, 26835.0, 452239.0, 522150.0, 32202.0, 4385.0, 1499.0, 731.0, 435.0, 243.0, 171.0, 99.0, 59.0, 40.0, 34.0, 26.0, 17.0, 15.0, 11.0, 5.0, 4.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.024139404296875, -0.023487567901611328, -0.022835731506347656, -0.022183895111083984, -0.021532058715820312, -0.02088022232055664, -0.02022838592529297, -0.019576549530029297, -0.018924713134765625, -0.018272876739501953, -0.01762104034423828, -0.01696920394897461, -0.016317367553710938, -0.015665531158447266, -0.015013694763183594, -0.014361858367919922, -0.01371002197265625, -0.013058185577392578, -0.012406349182128906, -0.011754512786865234, -0.011102676391601562, -0.01045083999633789, -0.009799003601074219, -0.009147167205810547, -0.008495330810546875, -0.007843494415283203, -0.007191658020019531, -0.006539821624755859, -0.0058879852294921875, -0.005236148834228516, -0.004584312438964844, -0.003932476043701172, -0.0032806396484375, -0.002628803253173828, -0.0019769668579101562, -0.0013251304626464844, -0.0006732940673828125, -2.1457672119140625e-05, 0.0006303787231445312, 0.0012822151184082031, 0.001934051513671875, 0.002585887908935547, 0.0032377243041992188, 0.0038895606994628906, 0.0045413970947265625, 0.005193233489990234, 0.005845069885253906, 0.006496906280517578, 0.00714874267578125, 0.007800579071044922, 0.008452415466308594, 0.009104251861572266, 0.009756088256835938, 0.01040792465209961, 0.011059761047363281, 0.011711597442626953, 0.012363433837890625, 0.013015270233154297, 0.013667106628417969, 0.01431894302368164, 0.014970779418945312, 0.015622615814208984, 0.016274452209472656, 0.016926288604736328, 0.017578125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 5.0, 5.0, 4.0, 11.0, 8.0, 21.0, 14.0, 17.0, 17.0, 24.0, 40.0, 46.0, 41.0, 47.0, 54.0, 46.0, 47.0, 50.0, 53.0, 52.0, 53.0, 52.0, 40.0, 41.0, 36.0, 24.0, 35.0, 20.0, 21.0, 18.0, 14.0, 10.0, 8.0, 5.0, 5.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0101470947265625, -0.00987231731414795, -0.009597539901733398, -0.009322762489318848, -0.009047985076904297, -0.008773207664489746, -0.008498430252075195, -0.008223652839660645, -0.007948875427246094, -0.007674098014831543, -0.007399320602416992, -0.007124543190002441, -0.006849765777587891, -0.00657498836517334, -0.006300210952758789, -0.006025433540344238, -0.0057506561279296875, -0.005475878715515137, -0.005201101303100586, -0.004926323890686035, -0.004651546478271484, -0.004376769065856934, -0.004101991653442383, -0.003827214241027832, -0.0035524368286132812, -0.0032776594161987305, -0.0030028820037841797, -0.002728104591369629, -0.002453327178955078, -0.0021785497665405273, -0.0019037723541259766, -0.0016289949417114258, -0.001354217529296875, -0.0010794401168823242, -0.0008046627044677734, -0.0005298852920532227, -0.0002551078796386719, 1.9669532775878906e-05, 0.0002944469451904297, 0.0005692243576049805, 0.0008440017700195312, 0.001118779182434082, 0.0013935565948486328, 0.0016683340072631836, 0.0019431114196777344, 0.002217888832092285, 0.002492666244506836, 0.0027674436569213867, 0.0030422210693359375, 0.0033169984817504883, 0.003591775894165039, 0.00386655330657959, 0.004141330718994141, 0.004416108131408691, 0.004690885543823242, 0.004965662956237793, 0.005240440368652344, 0.0055152177810668945, 0.005789995193481445, 0.006064772605895996, 0.006339550018310547, 0.006614327430725098, 0.0068891048431396484, 0.007163882255554199, 0.00743865966796875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 8.0, 3.0, 2.0, 6.0, 7.0, 20.0, 24.0, 41.0, 66.0, 146.0, 304.0, 722.0, 1699.0, 5258.0, 27536.0, 925361.0, 75692.0, 7539.0, 2380.0, 904.0, 415.0, 183.0, 100.0, 42.0, 34.0, 20.0, 14.0, 11.0, 2.0, 9.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02093505859375, -0.020363926887512207, -0.019792795181274414, -0.01922166347503662, -0.018650531768798828, -0.018079400062561035, -0.017508268356323242, -0.01693713665008545, -0.016366004943847656, -0.015794873237609863, -0.01522374153137207, -0.014652609825134277, -0.014081478118896484, -0.013510346412658691, -0.012939214706420898, -0.012368083000183105, -0.011796951293945312, -0.01122581958770752, -0.010654687881469727, -0.010083556175231934, -0.00951242446899414, -0.008941292762756348, -0.008370161056518555, -0.007799029350280762, -0.007227897644042969, -0.006656765937805176, -0.006085634231567383, -0.00551450252532959, -0.004943370819091797, -0.004372239112854004, -0.003801107406616211, -0.003229975700378418, -0.002658843994140625, -0.002087712287902832, -0.001516580581665039, -0.0009454488754272461, -0.0003743171691894531, 0.00019681453704833984, 0.0007679462432861328, 0.0013390779495239258, 0.0019102096557617188, 0.0024813413619995117, 0.0030524730682373047, 0.0036236047744750977, 0.004194736480712891, 0.004765868186950684, 0.0053369998931884766, 0.0059081315994262695, 0.0064792633056640625, 0.0070503950119018555, 0.0076215267181396484, 0.008192658424377441, 0.008763790130615234, 0.009334921836853027, 0.00990605354309082, 0.010477185249328613, 0.011048316955566406, 0.0116194486618042, 0.012190580368041992, 0.012761712074279785, 0.013332843780517578, 0.013903975486755371, 0.014475107192993164, 0.015046238899230957, 0.01561737060546875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 4.0, 6.0, 3.0, 3.0, 7.0, 5.0, 5.0, 6.0, 7.0, 5.0, 7.0, 6.0, 13.0, 13.0, 18.0, 13.0, 22.0, 22.0, 24.0, 35.0, 40.0, 42.0, 59.0, 68.0, 88.0, 66.0, 58.0, 50.0, 43.0, 45.0, 37.0, 32.0, 21.0, 19.0, 19.0, 18.0, 13.0, 13.0, 4.0, 6.0, 8.0, 1.0, 4.0, 2.0, 3.0, 6.0, 4.0, 4.0, 4.0, 3.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.943941116333008e-05, -6.703101098537445e-05, -6.462261080741882e-05, -6.22142106294632e-05, -5.980581045150757e-05, -5.739741027355194e-05, -5.4989010095596313e-05, -5.2580609917640686e-05, -5.017220973968506e-05, -4.776380956172943e-05, -4.5355409383773804e-05, -4.2947009205818176e-05, -4.053860902786255e-05, -3.813020884990692e-05, -3.5721808671951294e-05, -3.3313408493995667e-05, -3.090500831604004e-05, -2.849660813808441e-05, -2.6088207960128784e-05, -2.3679807782173157e-05, -2.127140760421753e-05, -1.8863007426261902e-05, -1.6454607248306274e-05, -1.4046207070350647e-05, -1.163780689239502e-05, -9.229406714439392e-06, -6.821006536483765e-06, -4.412606358528137e-06, -2.0042061805725098e-06, 4.041939973831177e-07, 2.812594175338745e-06, 5.2209943532943726e-06, 7.62939453125e-06, 1.0037794709205627e-05, 1.2446194887161255e-05, 1.4854595065116882e-05, 1.726299524307251e-05, 1.9671395421028137e-05, 2.2079795598983765e-05, 2.4488195776939392e-05, 2.689659595489502e-05, 2.9304996132850647e-05, 3.1713396310806274e-05, 3.41217964887619e-05, 3.653019666671753e-05, 3.893859684467316e-05, 4.1346997022628784e-05, 4.375539720058441e-05, 4.616379737854004e-05, 4.8572197556495667e-05, 5.0980597734451294e-05, 5.338899791240692e-05, 5.579739809036255e-05, 5.8205798268318176e-05, 6.0614198446273804e-05, 6.302259862422943e-05, 6.543099880218506e-05, 6.783939898014069e-05, 7.024779915809631e-05, 7.265619933605194e-05, 7.506459951400757e-05, 7.74729996919632e-05, 7.988139986991882e-05, 8.228980004787445e-05, 8.469820022583008e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 6.0, 9.0, 10.0, 12.0, 24.0, 20.0, 33.0, 56.0, 85.0, 129.0, 269.0, 594.0, 1445.0, 4657.0, 24605.0, 853060.0, 148413.0, 10510.0, 2691.0, 942.0, 413.0, 220.0, 116.0, 71.0, 42.0, 23.0, 22.0, 19.0, 14.0, 11.0, 3.0, 5.0, 5.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.016082763671875, -0.01560664176940918, -0.01513051986694336, -0.014654397964477539, -0.014178276062011719, -0.013702154159545898, -0.013226032257080078, -0.012749910354614258, -0.012273788452148438, -0.011797666549682617, -0.011321544647216797, -0.010845422744750977, -0.010369300842285156, -0.009893178939819336, -0.009417057037353516, -0.008940935134887695, -0.008464813232421875, -0.007988691329956055, -0.007512569427490234, -0.007036447525024414, -0.006560325622558594, -0.0060842037200927734, -0.005608081817626953, -0.005131959915161133, -0.0046558380126953125, -0.004179716110229492, -0.003703594207763672, -0.0032274723052978516, -0.0027513504028320312, -0.002275228500366211, -0.0017991065979003906, -0.0013229846954345703, -0.00084686279296875, -0.0003707408905029297, 0.00010538101196289062, 0.0005815029144287109, 0.0010576248168945312, 0.0015337467193603516, 0.002009868621826172, 0.002485990524291992, 0.0029621124267578125, 0.003438234329223633, 0.003914356231689453, 0.0043904781341552734, 0.004866600036621094, 0.005342721939086914, 0.005818843841552734, 0.006294965744018555, 0.006771087646484375, 0.007247209548950195, 0.007723331451416016, 0.008199453353881836, 0.008675575256347656, 0.009151697158813477, 0.009627819061279297, 0.010103940963745117, 0.010580062866210938, 0.011056184768676758, 0.011532306671142578, 0.012008428573608398, 0.012484550476074219, 0.012960672378540039, 0.01343679428100586, 0.01391291618347168, 0.0143890380859375]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 4.0, 1.0, 2.0, 8.0, 7.0, 6.0, 10.0, 13.0, 18.0, 31.0, 47.0, 71.0, 114.0, 149.0, 155.0, 106.0, 81.0, 44.0, 38.0, 22.0, 22.0, 7.0, 7.0, 8.0, 6.0, 6.0, 3.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005096435546875, -0.00493699312210083, -0.00477755069732666, -0.00461810827255249, -0.00445866584777832, -0.00429922342300415, -0.0041397809982299805, -0.0039803385734558105, -0.0038208961486816406, -0.0036614537239074707, -0.0035020112991333008, -0.003342568874359131, -0.003183126449584961, -0.003023684024810791, -0.002864241600036621, -0.002704799175262451, -0.0025453567504882812, -0.0023859143257141113, -0.0022264719009399414, -0.0020670294761657715, -0.0019075870513916016, -0.0017481446266174316, -0.0015887022018432617, -0.0014292597770690918, -0.0012698173522949219, -0.001110374927520752, -0.000950932502746582, -0.0007914900779724121, -0.0006320476531982422, -0.00047260522842407227, -0.00031316280364990234, -0.00015372037887573242, 5.7220458984375e-06, 0.00016516447067260742, 0.00032460689544677734, 0.00048404932022094727, 0.0006434917449951172, 0.0008029341697692871, 0.000962376594543457, 0.001121819019317627, 0.0012812614440917969, 0.0014407038688659668, 0.0016001462936401367, 0.0017595887184143066, 0.0019190311431884766, 0.0020784735679626465, 0.0022379159927368164, 0.0023973584175109863, 0.0025568008422851562, 0.002716243267059326, 0.002875685691833496, 0.003035128116607666, 0.003194570541381836, 0.003354012966156006, 0.0035134553909301758, 0.0036728978157043457, 0.0038323402404785156, 0.0039917826652526855, 0.0041512250900268555, 0.004310667514801025, 0.004470109939575195, 0.004629552364349365, 0.004788994789123535, 0.004948437213897705, 0.005107879638671875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 10.0, 41.0, 178.0, 465.0, 222.0, 68.0, 10.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16380207240581512, -0.15944521129131317, -0.15508833527565002, -0.15073147416114807, -0.14637459814548492, -0.14201773703098297, -0.13766086101531982, -0.13330399990081787, -0.12894713878631592, -0.12459027022123337, -0.12023340165615082, -0.11587653309106827, -0.11151966452598572, -0.10716280341148376, -0.10280593484640121, -0.09844906628131866, -0.09409219026565552, -0.08973532170057297, -0.08537845313549042, -0.08102158457040787, -0.07666471600532532, -0.07230785489082336, -0.06795098632574081, -0.06359411776065826, -0.059237249195575714, -0.054880380630493164, -0.050523512065410614, -0.04616664722561836, -0.04180977866053581, -0.03745291009545326, -0.03309604525566101, -0.02873917669057846, -0.024382293224334717, -0.020025424659252167, -0.015668557956814766, -0.01131169032305479, -0.006954822689294815, -0.002597954124212265, 0.0017589125782251358, 0.006115779280662537, 0.010472647845745087, 0.014829515479505062, 0.019186383113265038, 0.02354324981570244, 0.02790011838078499, 0.03225698694586754, 0.03661385178565979, 0.04097072035074234, 0.04532758891582489, 0.04968445748090744, 0.05404132604598999, 0.05839819088578224, 0.06275506317615509, 0.06711192429065704, 0.0714687928557396, 0.07582566142082214, 0.0801825299859047, 0.08453939855098724, 0.0888962671160698, 0.09325313568115234, 0.0976099967956543, 0.10196687281131744, 0.1063237339258194, 0.11068060249090195, 0.1150374710559845]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 8.0, 5.0, 7.0, 6.0, 18.0, 19.0, 26.0, 31.0, 39.0, 64.0, 50.0, 78.0, 74.0, 68.0, 86.0, 65.0, 72.0, 50.0, 66.0, 39.0, 37.0, 32.0, 24.0, 14.0, 11.0, 6.0, 7.0, 2.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04028785228729248, -0.03885223716497421, -0.037416622042655945, -0.03598100319504738, -0.03454538807272911, -0.03310977295041084, -0.03167415410280228, -0.03023853898048401, -0.02880292385816574, -0.027367308735847473, -0.025931691750884056, -0.02449607476592064, -0.02306045964360237, -0.021624844521284103, -0.020189227536320686, -0.01875361055135727, -0.017317995429039, -0.015882380306720734, -0.014446763321757317, -0.013011147268116474, -0.011575531214475632, -0.01013991516083479, -0.008704299107193947, -0.007268683053553104, -0.005833066999912262, -0.0043974509462714195, -0.002961834892630577, -0.0015262188389897346, -9.060278534889221e-05, 0.0013450132682919502, 0.0027806293219327927, 0.004216245375573635, 0.0056518614292144775, 0.00708747748285532, 0.008523093536496162, 0.009958709590137005, 0.011394325643777847, 0.01282994169741869, 0.014265557751059532, 0.01570117473602295, 0.017136789858341217, 0.018572404980659485, 0.020008021965622902, 0.02144363895058632, 0.022879254072904587, 0.024314869195222855, 0.02575048618018627, 0.02718610316514969, 0.028621718287467957, 0.030057333409786224, 0.03149294853210449, 0.03292856737971306, 0.034364182502031326, 0.035799797624349594, 0.03723541647195816, 0.03867103159427643, 0.040106646716594696, 0.041542261838912964, 0.04297787696123123, 0.0444134958088398, 0.045849110931158066, 0.047284726053476334, 0.0487203449010849, 0.05015596002340317, 0.051591575145721436]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 1.0, 5.0, 5.0, 9.0, 10.0, 9.0, 22.0, 29.0, 33.0, 34.0, 56.0, 80.0, 105.0, 134.0, 179.0, 279.0, 555.0, 2337.0, 21483.0, 4062604.0, 98407.0, 4461.0, 1886.0, 1007.0, 240.0, 122.0, 70.0, 36.0, 28.0, 19.0, 11.0, 8.0, 4.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0299072265625, -0.029069185256958008, -0.028231143951416016, -0.027393102645874023, -0.02655506134033203, -0.02571702003479004, -0.024878978729248047, -0.024040937423706055, -0.023202896118164062, -0.02236485481262207, -0.021526813507080078, -0.020688772201538086, -0.019850730895996094, -0.0190126895904541, -0.01817464828491211, -0.017336606979370117, -0.016498565673828125, -0.015660524368286133, -0.01482248306274414, -0.013984441757202148, -0.013146400451660156, -0.012308359146118164, -0.011470317840576172, -0.01063227653503418, -0.009794235229492188, -0.008956193923950195, -0.008118152618408203, -0.007280111312866211, -0.006442070007324219, -0.0056040287017822266, -0.004765987396240234, -0.003927946090698242, -0.00308990478515625, -0.002251863479614258, -0.0014138221740722656, -0.0005757808685302734, 0.00026226043701171875, 0.001100301742553711, 0.0019383430480957031, 0.0027763843536376953, 0.0036144256591796875, 0.00445246696472168, 0.005290508270263672, 0.006128549575805664, 0.006966590881347656, 0.0078046321868896484, 0.00864267349243164, 0.009480714797973633, 0.010318756103515625, 0.011156797409057617, 0.01199483871459961, 0.012832880020141602, 0.013670921325683594, 0.014508962631225586, 0.015347003936767578, 0.01618504524230957, 0.017023086547851562, 0.017861127853393555, 0.018699169158935547, 0.01953721046447754, 0.02037525177001953, 0.021213293075561523, 0.022051334381103516, 0.022889375686645508, 0.0237274169921875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 13.0, 57.0, 184.0, 352.0, 291.0, 89.0, 18.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0232391357421875, -0.022694945335388184, -0.022150754928588867, -0.02160656452178955, -0.021062374114990234, -0.020518183708190918, -0.0199739933013916, -0.019429802894592285, -0.01888561248779297, -0.018341422080993652, -0.017797231674194336, -0.01725304126739502, -0.016708850860595703, -0.016164660453796387, -0.01562047004699707, -0.015076279640197754, -0.014532089233398438, -0.013987898826599121, -0.013443708419799805, -0.012899518013000488, -0.012355327606201172, -0.011811137199401855, -0.011266946792602539, -0.010722756385803223, -0.010178565979003906, -0.00963437557220459, -0.009090185165405273, -0.008545994758605957, -0.00800180435180664, -0.007457613945007324, -0.006913423538208008, -0.006369233131408691, -0.005825042724609375, -0.005280852317810059, -0.004736661911010742, -0.004192471504211426, -0.0036482810974121094, -0.003104090690612793, -0.0025599002838134766, -0.00201570987701416, -0.0014715194702148438, -0.0009273290634155273, -0.00038313865661621094, 0.00016105175018310547, 0.0007052421569824219, 0.0012494325637817383, 0.0017936229705810547, 0.002337813377380371, 0.0028820037841796875, 0.003426194190979004, 0.00397038459777832, 0.004514575004577637, 0.005058765411376953, 0.0056029558181762695, 0.006147146224975586, 0.006691336631774902, 0.007235527038574219, 0.007779717445373535, 0.008323907852172852, 0.008868098258972168, 0.009412288665771484, 0.0099564790725708, 0.010500669479370117, 0.011044859886169434, 0.01158905029296875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 8.0, 5.0, 14.0, 17.0, 27.0, 52.0, 97.0, 162.0, 365.0, 977.0, 3591.0, 50054.0, 4035391.0, 97015.0, 4592.0, 1143.0, 377.0, 176.0, 86.0, 44.0, 24.0, 11.0, 13.0, 9.0, 7.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0233001708984375, -0.022680044174194336, -0.022059917449951172, -0.021439790725708008, -0.020819664001464844, -0.02019953727722168, -0.019579410552978516, -0.01895928382873535, -0.018339157104492188, -0.017719030380249023, -0.01709890365600586, -0.016478776931762695, -0.01585865020751953, -0.015238523483276367, -0.014618396759033203, -0.013998270034790039, -0.013378143310546875, -0.012758016586303711, -0.012137889862060547, -0.011517763137817383, -0.010897636413574219, -0.010277509689331055, -0.00965738296508789, -0.009037256240844727, -0.008417129516601562, -0.0077970027923583984, -0.007176876068115234, -0.00655674934387207, -0.005936622619628906, -0.005316495895385742, -0.004696369171142578, -0.004076242446899414, -0.00345611572265625, -0.002835988998413086, -0.002215862274169922, -0.0015957355499267578, -0.0009756088256835938, -0.0003554821014404297, 0.0002646446228027344, 0.0008847713470458984, 0.0015048980712890625, 0.0021250247955322266, 0.0027451515197753906, 0.0033652782440185547, 0.003985404968261719, 0.004605531692504883, 0.005225658416748047, 0.005845785140991211, 0.006465911865234375, 0.007086038589477539, 0.007706165313720703, 0.008326292037963867, 0.008946418762207031, 0.009566545486450195, 0.01018667221069336, 0.010806798934936523, 0.011426925659179688, 0.012047052383422852, 0.012667179107666016, 0.01328730583190918, 0.013907432556152344, 0.014527559280395508, 0.015147686004638672, 0.015767812728881836, 0.016387939453125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 5.0, 4.0, 6.0, 9.0, 15.0, 26.0, 47.0, 66.0, 123.0, 312.0, 865.0, 1325.0, 645.0, 283.0, 136.0, 90.0, 53.0, 34.0, 15.0, 6.0, 2.0, 7.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007656097412109375, -0.007354080677032471, -0.007052063941955566, -0.006750047206878662, -0.006448030471801758, -0.0061460137367248535, -0.005843997001647949, -0.005541980266571045, -0.005239963531494141, -0.004937946796417236, -0.004635930061340332, -0.004333913326263428, -0.0040318965911865234, -0.003729879856109619, -0.003427863121032715, -0.0031258463859558105, -0.0028238296508789062, -0.002521812915802002, -0.0022197961807250977, -0.0019177794456481934, -0.001615762710571289, -0.0013137459754943848, -0.0010117292404174805, -0.0007097125053405762, -0.0004076957702636719, -0.00010567903518676758, 0.00019633769989013672, 0.000498354434967041, 0.0008003711700439453, 0.0011023879051208496, 0.001404404640197754, 0.0017064213752746582, 0.0020084381103515625, 0.002310454845428467, 0.002612471580505371, 0.0029144883155822754, 0.0032165050506591797, 0.003518521785736084, 0.0038205385208129883, 0.004122555255889893, 0.004424571990966797, 0.004726588726043701, 0.0050286054611206055, 0.00533062219619751, 0.005632638931274414, 0.005934655666351318, 0.006236672401428223, 0.006538689136505127, 0.006840705871582031, 0.0071427226066589355, 0.00744473934173584, 0.007746756076812744, 0.008048772811889648, 0.008350789546966553, 0.008652806282043457, 0.008954823017120361, 0.009256839752197266, 0.00955885648727417, 0.009860873222351074, 0.010162889957427979, 0.010464906692504883, 0.010766923427581787, 0.011068940162658691, 0.011370956897735596, 0.0116729736328125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 7.0, 41.0, 168.0, 339.0, 268.0, 111.0, 34.0, 17.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041651468724012375, -0.03972947224974632, -0.03780747950077057, -0.03588548302650452, -0.033963486552238464, -0.03204149380326271, -0.03011949732899666, -0.028197502717375755, -0.026275508105754852, -0.02435351349413395, -0.022431518882513046, -0.020509522408246994, -0.01858752779662609, -0.016665533185005188, -0.01474353764206171, -0.012821542099118233, -0.01089954748749733, -0.008977552875876427, -0.007055557332932949, -0.005133562255650759, -0.0032115671783685684, -0.0012895725667476654, 0.0006324229761958122, 0.00255441851913929, 0.004476413130760193, 0.006398408208042383, 0.008320403285324574, 0.010242398828268051, 0.012164393439888954, 0.014086388051509857, 0.01600838452577591, 0.017930379137396812, 0.019852377474308014, 0.021774372085928917, 0.02369636669754982, 0.025618363171815872, 0.027540357783436775, 0.029462352395057678, 0.03138434886932373, 0.03330634534358978, 0.035228338092565536, 0.03715033456683159, 0.03907232731580734, 0.040994323790073395, 0.04291632026433945, 0.0448383130133152, 0.04676030948758125, 0.04868230223655701, 0.05060429871082306, 0.05252629518508911, 0.054448287934064865, 0.05637028440833092, 0.05829227715730667, 0.06021427363157272, 0.062136270105838776, 0.06405826658010483, 0.06598025560379028, 0.06790225207805634, 0.06982424855232239, 0.07174623757600784, 0.0736682340502739, 0.07559023052453995, 0.077512226998806, 0.07943422347307205, 0.0813562199473381]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 7.0, 8.0, 12.0, 18.0, 9.0, 23.0, 27.0, 43.0, 33.0, 49.0, 56.0, 50.0, 50.0, 64.0, 57.0, 69.0, 58.0, 52.0, 60.0, 40.0, 50.0, 37.0, 29.0, 25.0, 28.0, 10.0, 11.0, 4.0, 11.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024130165576934814, -0.023473240435123444, -0.022816317155957222, -0.022159393876791, -0.02150246873497963, -0.02084554359316826, -0.020188620314002037, -0.019531697034835815, -0.018874771893024445, -0.018217846751213074, -0.017560923472046852, -0.01690400019288063, -0.01624707505106926, -0.015590150840580463, -0.014933226630091667, -0.014276302419602871, -0.013619378209114075, -0.012962453998625278, -0.012305529788136482, -0.011648605577647686, -0.01099168136715889, -0.010334757156670094, -0.009677832946181297, -0.009020908735692501, -0.008363984525203705, -0.007707060314714909, -0.007050136104226112, -0.006393211893737316, -0.00573628768324852, -0.005079363472759724, -0.004422439262270927, -0.003765515051782131, -0.003108590841293335, -0.0024516666308045387, -0.0017947424203157425, -0.0011378182098269463, -0.00048089399933815, 0.0001760302111506462, 0.0008329544216394424, 0.0014898786321282387, 0.002146802842617035, 0.002803727053105831, 0.0034606512635946274, 0.004117575474083424, 0.00477449968457222, 0.005431423895061016, 0.006088348105549812, 0.0067452723160386086, 0.007402196526527405, 0.008059120737016201, 0.008716044947504997, 0.009372969157993793, 0.01002989336848259, 0.010686817578971386, 0.011343741789460182, 0.012000665999948978, 0.012657590210437775, 0.013314514420926571, 0.013971438631415367, 0.014628362841904163, 0.01528528705239296, 0.01594221219420433, 0.016599135473370552, 0.017256058752536774, 0.017912983894348145]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 3.0, 6.0, 5.0, 8.0, 11.0, 13.0, 20.0, 23.0, 33.0, 50.0, 74.0, 89.0, 153.0, 184.0, 278.0, 429.0, 734.0, 1548.0, 10187.0, 635336.0, 389137.0, 6768.0, 1403.0, 711.0, 441.0, 263.0, 186.0, 118.0, 92.0, 56.0, 50.0, 35.0, 24.0, 15.0, 17.0, 12.0, 21.0, 5.0, 3.0, 0.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 3.0, 4.0], "bins": [-0.030731201171875, -0.029875993728637695, -0.02902078628540039, -0.028165578842163086, -0.02731037139892578, -0.026455163955688477, -0.025599956512451172, -0.024744749069213867, -0.023889541625976562, -0.023034334182739258, -0.022179126739501953, -0.02132391929626465, -0.020468711853027344, -0.01961350440979004, -0.018758296966552734, -0.01790308952331543, -0.017047882080078125, -0.01619267463684082, -0.015337467193603516, -0.014482259750366211, -0.013627052307128906, -0.012771844863891602, -0.011916637420654297, -0.011061429977416992, -0.010206222534179688, -0.009351015090942383, -0.008495807647705078, -0.0076406002044677734, -0.006785392761230469, -0.005930185317993164, -0.005074977874755859, -0.004219770431518555, -0.00336456298828125, -0.0025093555450439453, -0.0016541481018066406, -0.0007989406585693359, 5.626678466796875e-05, 0.0009114742279052734, 0.0017666816711425781, 0.002621889114379883, 0.0034770965576171875, 0.004332304000854492, 0.005187511444091797, 0.0060427188873291016, 0.006897926330566406, 0.007753133773803711, 0.008608341217041016, 0.00946354866027832, 0.010318756103515625, 0.01117396354675293, 0.012029170989990234, 0.012884378433227539, 0.013739585876464844, 0.014594793319702148, 0.015450000762939453, 0.016305208206176758, 0.017160415649414062, 0.018015623092651367, 0.018870830535888672, 0.019726037979125977, 0.02058124542236328, 0.021436452865600586, 0.02229166030883789, 0.023146867752075195, 0.0240020751953125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 6.0, 36.0, 153.0, 354.0, 330.0, 107.0, 20.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0234527587890625, -0.022905349731445312, -0.022357940673828125, -0.021810531616210938, -0.02126312255859375, -0.020715713500976562, -0.020168304443359375, -0.019620895385742188, -0.019073486328125, -0.018526077270507812, -0.017978668212890625, -0.017431259155273438, -0.01688385009765625, -0.016336441040039062, -0.015789031982421875, -0.015241622924804688, -0.0146942138671875, -0.014146804809570312, -0.013599395751953125, -0.013051986694335938, -0.01250457763671875, -0.011957168579101562, -0.011409759521484375, -0.010862350463867188, -0.01031494140625, -0.009767532348632812, -0.009220123291015625, -0.008672714233398438, -0.00812530517578125, -0.0075778961181640625, -0.007030487060546875, -0.0064830780029296875, -0.0059356689453125, -0.0053882598876953125, -0.004840850830078125, -0.0042934417724609375, -0.00374603271484375, -0.0031986236572265625, -0.002651214599609375, -0.0021038055419921875, -0.001556396484375, -0.0010089874267578125, -0.000461578369140625, 8.58306884765625e-05, 0.00063323974609375, 0.0011806488037109375, 0.001728057861328125, 0.0022754669189453125, 0.0028228759765625, 0.0033702850341796875, 0.003917694091796875, 0.0044651031494140625, 0.00501251220703125, 0.0055599212646484375, 0.006107330322265625, 0.0066547393798828125, 0.0072021484375, 0.0077495574951171875, 0.008296966552734375, 0.008844375610351562, 0.00939178466796875, 0.009939193725585938, 0.010486602783203125, 0.011034011840820312, 0.0115814208984375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 8.0, 7.0, 13.0, 18.0, 31.0, 31.0, 43.0, 55.0, 60.0, 98.0, 139.0, 202.0, 302.0, 448.0, 813.0, 1543.0, 5265.0, 38947.0, 487099.0, 467494.0, 36983.0, 5114.0, 1528.0, 829.0, 457.0, 294.0, 217.0, 137.0, 107.0, 74.0, 59.0, 29.0, 35.0, 28.0, 14.0, 7.0, 6.0, 8.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01222991943359375, -0.011808037757873535, -0.01138615608215332, -0.010964274406433105, -0.01054239273071289, -0.010120511054992676, -0.009698629379272461, -0.009276747703552246, -0.008854866027832031, -0.008432984352111816, -0.008011102676391602, -0.007589221000671387, -0.007167339324951172, -0.006745457649230957, -0.006323575973510742, -0.005901694297790527, -0.0054798126220703125, -0.005057930946350098, -0.004636049270629883, -0.004214167594909668, -0.003792285919189453, -0.0033704042434692383, -0.0029485225677490234, -0.0025266408920288086, -0.0021047592163085938, -0.001682877540588379, -0.001260995864868164, -0.0008391141891479492, -0.0004172325134277344, 4.649162292480469e-06, 0.0004265308380126953, 0.0008484125137329102, 0.001270294189453125, 0.0016921758651733398, 0.0021140575408935547, 0.0025359392166137695, 0.0029578208923339844, 0.0033797025680541992, 0.003801584243774414, 0.004223465919494629, 0.004645347595214844, 0.005067229270935059, 0.0054891109466552734, 0.005910992622375488, 0.006332874298095703, 0.006754755973815918, 0.007176637649536133, 0.007598519325256348, 0.008020401000976562, 0.008442282676696777, 0.008864164352416992, 0.009286046028137207, 0.009707927703857422, 0.010129809379577637, 0.010551691055297852, 0.010973572731018066, 0.011395454406738281, 0.011817336082458496, 0.012239217758178711, 0.012661099433898926, 0.01308298110961914, 0.013504862785339355, 0.01392674446105957, 0.014348626136779785, 0.0147705078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 6.0, 5.0, 11.0, 11.0, 17.0, 20.0, 20.0, 30.0, 33.0, 30.0, 41.0, 34.0, 34.0, 50.0, 46.0, 34.0, 55.0, 42.0, 53.0, 52.0, 60.0, 42.0, 37.0, 32.0, 44.0, 27.0, 30.0, 22.0, 19.0, 13.0, 13.0, 10.0, 4.0, 7.0, 7.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.00963592529296875, -0.00936514139175415, -0.00909435749053955, -0.008823573589324951, -0.008552789688110352, -0.008282005786895752, -0.008011221885681152, -0.007740437984466553, -0.007469654083251953, -0.0071988701820373535, -0.006928086280822754, -0.006657302379608154, -0.006386518478393555, -0.006115734577178955, -0.0058449506759643555, -0.005574166774749756, -0.005303382873535156, -0.005032598972320557, -0.004761815071105957, -0.004491031169891357, -0.004220247268676758, -0.003949463367462158, -0.0036786794662475586, -0.003407895565032959, -0.0031371116638183594, -0.0028663277626037598, -0.00259554386138916, -0.0023247599601745605, -0.002053976058959961, -0.0017831921577453613, -0.0015124082565307617, -0.0012416243553161621, -0.0009708404541015625, -0.0007000565528869629, -0.0004292726516723633, -0.00015848875045776367, 0.00011229515075683594, 0.00038307905197143555, 0.0006538629531860352, 0.0009246468544006348, 0.0011954307556152344, 0.001466214656829834, 0.0017369985580444336, 0.002007782459259033, 0.002278566360473633, 0.0025493502616882324, 0.002820134162902832, 0.0030909180641174316, 0.0033617019653320312, 0.003632485866546631, 0.0039032697677612305, 0.00417405366897583, 0.00444483757019043, 0.004715621471405029, 0.004986405372619629, 0.0052571892738342285, 0.005527973175048828, 0.005798757076263428, 0.006069540977478027, 0.006340324878692627, 0.0066111087799072266, 0.006881892681121826, 0.007152676582336426, 0.007423460483551025, 0.007694244384765625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 11.0, 14.0, 23.0, 21.0, 36.0, 69.0, 111.0, 148.0, 246.0, 437.0, 647.0, 1129.0, 2040.0, 3773.0, 7799.0, 18102.0, 55884.0, 283558.0, 524194.0, 100624.0, 27790.0, 10707.0, 4913.0, 2619.0, 1489.0, 841.0, 485.0, 320.0, 177.0, 129.0, 67.0, 57.0, 30.0, 22.0, 16.0, 10.0, 4.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003894805908203125, -0.0037738680839538574, -0.00365293025970459, -0.0035319924354553223, -0.0034110546112060547, -0.003290116786956787, -0.0031691789627075195, -0.003048241138458252, -0.0029273033142089844, -0.002806365489959717, -0.0026854276657104492, -0.0025644898414611816, -0.002443552017211914, -0.0023226141929626465, -0.002201676368713379, -0.0020807385444641113, -0.0019598007202148438, -0.0018388628959655762, -0.0017179250717163086, -0.001596987247467041, -0.0014760494232177734, -0.0013551115989685059, -0.0012341737747192383, -0.0011132359504699707, -0.0009922981262207031, -0.0008713603019714355, -0.000750422477722168, -0.0006294846534729004, -0.0005085468292236328, -0.00038760900497436523, -0.00026667118072509766, -0.00014573335647583008, -2.47955322265625e-05, 9.614229202270508e-05, 0.00021708011627197266, 0.00033801794052124023, 0.0004589557647705078, 0.0005798935890197754, 0.000700831413269043, 0.0008217692375183105, 0.0009427070617675781, 0.0010636448860168457, 0.0011845827102661133, 0.0013055205345153809, 0.0014264583587646484, 0.001547396183013916, 0.0016683340072631836, 0.0017892718315124512, 0.0019102096557617188, 0.0020311474800109863, 0.002152085304260254, 0.0022730231285095215, 0.002393960952758789, 0.0025148987770080566, 0.0026358366012573242, 0.002756774425506592, 0.0028777122497558594, 0.002998650074005127, 0.0031195878982543945, 0.003240525722503662, 0.0033614635467529297, 0.0034824013710021973, 0.003603339195251465, 0.0037242770195007324, 0.00384521484375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 4.0, 5.0, 11.0, 7.0, 12.0, 14.0, 20.0, 20.0, 23.0, 37.0, 32.0, 35.0, 63.0, 70.0, 78.0, 95.0, 99.0, 79.0, 52.0, 54.0, 30.0, 32.0, 22.0, 23.0, 15.0, 9.0, 11.0, 7.0, 9.0, 7.0, 2.0, 4.0, 1.0, 5.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.678436279296875e-05, -8.363183587789536e-05, -8.047930896282196e-05, -7.732678204774857e-05, -7.417425513267517e-05, -7.102172821760178e-05, -6.786920130252838e-05, -6.471667438745499e-05, -6.156414747238159e-05, -5.84116205573082e-05, -5.52590936422348e-05, -5.210656672716141e-05, -4.895403981208801e-05, -4.580151289701462e-05, -4.264898598194122e-05, -3.949645906686783e-05, -3.6343932151794434e-05, -3.319140523672104e-05, -3.0038878321647644e-05, -2.688635140657425e-05, -2.3733824491500854e-05, -2.058129757642746e-05, -1.7428770661354065e-05, -1.427624374628067e-05, -1.1123716831207275e-05, -7.97118991613388e-06, -4.818663001060486e-06, -1.666136085987091e-06, 1.4863908290863037e-06, 4.6389177441596985e-06, 7.791444659233093e-06, 1.0943971574306488e-05, 1.4096498489379883e-05, 1.7249025404453278e-05, 2.0401552319526672e-05, 2.3554079234600067e-05, 2.6706606149673462e-05, 2.9859133064746857e-05, 3.301165997982025e-05, 3.6164186894893646e-05, 3.931671380996704e-05, 4.2469240725040436e-05, 4.562176764011383e-05, 4.8774294555187225e-05, 5.192682147026062e-05, 5.5079348385334015e-05, 5.823187530040741e-05, 6.13844022154808e-05, 6.45369291305542e-05, 6.76894560456276e-05, 7.084198296070099e-05, 7.399450987577438e-05, 7.714703679084778e-05, 8.029956370592117e-05, 8.345209062099457e-05, 8.660461753606796e-05, 8.975714445114136e-05, 9.290967136621475e-05, 9.606219828128815e-05, 9.921472519636154e-05, 0.00010236725211143494, 0.00010551977902650833, 0.00010867230594158173, 0.00011182483285665512, 0.00011497735977172852]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 10.0, 6.0, 10.0, 19.0, 22.0, 47.0, 76.0, 179.0, 441.0, 1266.0, 5070.0, 36708.0, 916258.0, 78009.0, 7639.0, 1770.0, 564.0, 217.0, 105.0, 50.0, 37.0, 27.0, 11.0, 4.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01641845703125, -0.01598203182220459, -0.01554560661315918, -0.01510918140411377, -0.01467275619506836, -0.01423633098602295, -0.013799905776977539, -0.013363480567932129, -0.012927055358886719, -0.012490630149841309, -0.012054204940795898, -0.011617779731750488, -0.011181354522705078, -0.010744929313659668, -0.010308504104614258, -0.009872078895568848, -0.009435653686523438, -0.008999228477478027, -0.008562803268432617, -0.008126378059387207, -0.007689952850341797, -0.007253527641296387, -0.0068171024322509766, -0.006380677223205566, -0.005944252014160156, -0.005507826805114746, -0.005071401596069336, -0.004634976387023926, -0.004198551177978516, -0.0037621259689331055, -0.0033257007598876953, -0.002889275550842285, -0.002452850341796875, -0.002016425132751465, -0.0015799999237060547, -0.0011435747146606445, -0.0007071495056152344, -0.0002707242965698242, 0.00016570091247558594, 0.0006021261215209961, 0.0010385513305664062, 0.0014749765396118164, 0.0019114017486572266, 0.0023478269577026367, 0.002784252166748047, 0.003220677375793457, 0.003657102584838867, 0.004093527793884277, 0.0045299530029296875, 0.004966378211975098, 0.005402803421020508, 0.005839228630065918, 0.006275653839111328, 0.006712079048156738, 0.0071485042572021484, 0.007584929466247559, 0.008021354675292969, 0.008457779884338379, 0.008894205093383789, 0.0093306303024292, 0.00976705551147461, 0.01020348072052002, 0.01063990592956543, 0.01107633113861084, 0.01151275634765625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 2.0, 4.0, 3.0, 4.0, 4.0, 8.0, 3.0, 9.0, 10.0, 15.0, 20.0, 22.0, 31.0, 36.0, 51.0, 76.0, 93.0, 122.0, 119.0, 88.0, 65.0, 58.0, 31.0, 26.0, 30.0, 22.0, 11.0, 9.0, 6.0, 9.0, 5.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004467010498046875, -0.004318296909332275, -0.004169583320617676, -0.004020869731903076, -0.0038721561431884766, -0.003723442554473877, -0.0035747289657592773, -0.0034260153770446777, -0.003277301788330078, -0.0031285881996154785, -0.002979874610900879, -0.0028311610221862793, -0.0026824474334716797, -0.00253373384475708, -0.0023850202560424805, -0.002236306667327881, -0.0020875930786132812, -0.0019388794898986816, -0.001790165901184082, -0.0016414523124694824, -0.0014927387237548828, -0.0013440251350402832, -0.0011953115463256836, -0.001046597957611084, -0.0008978843688964844, -0.0007491707801818848, -0.0006004571914672852, -0.00045174360275268555, -0.00030303001403808594, -0.00015431642532348633, -5.602836608886719e-06, 0.0001431107521057129, 0.0002918243408203125, 0.0004405379295349121, 0.0005892515182495117, 0.0007379651069641113, 0.0008866786956787109, 0.0010353922843933105, 0.0011841058731079102, 0.0013328194618225098, 0.0014815330505371094, 0.001630246639251709, 0.0017789602279663086, 0.0019276738166809082, 0.002076387405395508, 0.0022251009941101074, 0.002373814582824707, 0.0025225281715393066, 0.0026712417602539062, 0.002819955348968506, 0.0029686689376831055, 0.003117382526397705, 0.0032660961151123047, 0.0034148097038269043, 0.003563523292541504, 0.0037122368812561035, 0.003860950469970703, 0.004009664058685303, 0.004158377647399902, 0.004307091236114502, 0.0044558048248291016, 0.004604518413543701, 0.004753232002258301, 0.0049019455909729, 0.0050506591796875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 10.0, 41.0, 252.0, 498.0, 172.0, 28.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.20557162165641785, -0.20172464847564697, -0.1978776752948761, -0.19403070211410522, -0.19018372893333435, -0.18633675575256348, -0.1824897825717926, -0.17864280939102173, -0.17479583621025085, -0.17094886302947998, -0.1671018898487091, -0.16325491666793823, -0.15940794348716736, -0.15556097030639648, -0.1517139971256256, -0.14786702394485474, -0.14402005076408386, -0.140173077583313, -0.13632610440254211, -0.13247913122177124, -0.12863215804100037, -0.12478518486022949, -0.12093821167945862, -0.11709123849868774, -0.11324426531791687, -0.109397292137146, -0.10555031895637512, -0.10170334577560425, -0.09785637259483337, -0.0940093994140625, -0.09016242623329163, -0.08631545305252075, -0.08246848732233047, -0.0786215141415596, -0.07477454096078873, -0.07092756778001785, -0.06708059459924698, -0.0632336214184761, -0.05938664823770523, -0.05553967505693436, -0.05169270187616348, -0.04784572869539261, -0.043998755514621735, -0.04015178233385086, -0.03630480915307999, -0.03245783597230911, -0.02861086279153824, -0.024763889610767365, -0.02091691642999649, -0.017069943249225616, -0.013222970068454742, -0.009375996887683868, -0.005529023706912994, -0.0016820505261421204, 0.0021649226546287537, 0.006011895835399628, 0.009858869016170502, 0.013705842196941376, 0.01755281537771225, 0.021399788558483124, 0.025246761739253998, 0.029093734920024872, 0.032940708100795746, 0.03678768128156662, 0.040634654462337494]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 8.0, 3.0, 4.0, 6.0, 7.0, 9.0, 6.0, 8.0, 15.0, 12.0, 21.0, 15.0, 24.0, 36.0, 26.0, 18.0, 22.0, 24.0, 25.0, 29.0, 35.0, 32.0, 44.0, 50.0, 41.0, 32.0, 23.0, 36.0, 37.0, 31.0, 24.0, 26.0, 28.0, 26.0, 21.0, 20.0, 22.0, 21.0, 29.0, 18.0, 21.0, 19.0, 8.0, 10.0, 12.0, 8.0, 6.0, 4.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.019398212432861328, -0.018790343776345253, -0.018182475119829178, -0.017574606463313103, -0.016966737806797028, -0.016358869150280952, -0.015751000493764877, -0.015143131837248802, -0.014535263180732727, -0.013927394524216652, -0.013319525867700577, -0.012711657211184502, -0.012103788554668427, -0.011495919898152351, -0.010888051241636276, -0.010280182585120201, -0.009672313928604126, -0.00906444527208805, -0.008456576615571976, -0.0078487079590559, -0.0072408393025398254, -0.00663297064602375, -0.006025101989507675, -0.0054172333329916, -0.004809364676475525, -0.00420149601995945, -0.0035936273634433746, -0.0029857587069272995, -0.0023778900504112244, -0.0017700213938951492, -0.001162152737379074, -0.000554284080862999, 5.358457565307617e-05, 0.0006614532321691513, 0.0012693218886852264, 0.0018771905452013016, 0.0024850592017173767, 0.003092927858233452, 0.003700796514749527, 0.004308665171265602, 0.004916533827781677, 0.005524402484297752, 0.0061322711408138275, 0.006740139797329903, 0.007348008453845978, 0.007955877110362053, 0.008563745766878128, 0.009171614423394203, 0.009779483079910278, 0.010387351736426353, 0.010995220392942429, 0.011603089049458504, 0.012210957705974579, 0.012818826362490654, 0.013426695019006729, 0.014034563675522804, 0.01464243233203888, 0.015250300988554955, 0.01585816964507103, 0.016466038301587105, 0.01707390695810318, 0.017681775614619255, 0.01828964427113533, 0.018897512927651405, 0.01950538158416748]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 3.0, 9.0, 6.0, 6.0, 10.0, 7.0, 16.0, 15.0, 29.0, 32.0, 31.0, 65.0, 75.0, 120.0, 190.0, 263.0, 449.0, 1158.0, 11945.0, 4082944.0, 90543.0, 3999.0, 1608.0, 392.0, 145.0, 69.0, 45.0, 35.0, 18.0, 11.0, 10.0, 7.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03759765625, -0.036545753479003906, -0.03549385070800781, -0.03444194793701172, -0.033390045166015625, -0.03233814239501953, -0.03128623962402344, -0.030234336853027344, -0.02918243408203125, -0.028130531311035156, -0.027078628540039062, -0.02602672576904297, -0.024974822998046875, -0.02392292022705078, -0.022871017456054688, -0.021819114685058594, -0.0207672119140625, -0.019715309143066406, -0.018663406372070312, -0.01761150360107422, -0.016559600830078125, -0.015507698059082031, -0.014455795288085938, -0.013403892517089844, -0.01235198974609375, -0.011300086975097656, -0.010248184204101562, -0.009196281433105469, -0.008144378662109375, -0.007092475891113281, -0.0060405731201171875, -0.004988670349121094, -0.003936767578125, -0.0028848648071289062, -0.0018329620361328125, -0.0007810592651367188, 0.000270843505859375, 0.0013227462768554688, 0.0023746490478515625, 0.0034265518188476562, 0.00447845458984375, 0.005530357360839844, 0.0065822601318359375, 0.007634162902832031, 0.008686065673828125, 0.009737968444824219, 0.010789871215820312, 0.011841773986816406, 0.0128936767578125, 0.013945579528808594, 0.014997482299804688, 0.01604938507080078, 0.017101287841796875, 0.01815319061279297, 0.019205093383789062, 0.020256996154785156, 0.02130889892578125, 0.022360801696777344, 0.023412704467773438, 0.02446460723876953, 0.025516510009765625, 0.02656841278076172, 0.027620315551757812, 0.028672218322753906, 0.02972412109375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 5.0, 48.0, 180.0, 363.0, 325.0, 66.0, 19.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0234222412109375, -0.022873759269714355, -0.02232527732849121, -0.021776795387268066, -0.021228313446044922, -0.020679831504821777, -0.020131349563598633, -0.01958286762237549, -0.019034385681152344, -0.0184859037399292, -0.017937421798706055, -0.01738893985748291, -0.016840457916259766, -0.01629197597503662, -0.015743494033813477, -0.015195012092590332, -0.014646530151367188, -0.014098048210144043, -0.013549566268920898, -0.013001084327697754, -0.01245260238647461, -0.011904120445251465, -0.01135563850402832, -0.010807156562805176, -0.010258674621582031, -0.009710192680358887, -0.009161710739135742, -0.008613228797912598, -0.008064746856689453, -0.007516264915466309, -0.006967782974243164, -0.0064193010330200195, -0.005870819091796875, -0.0053223371505737305, -0.004773855209350586, -0.004225373268127441, -0.003676891326904297, -0.0031284093856811523, -0.002579927444458008, -0.0020314455032348633, -0.0014829635620117188, -0.0009344816207885742, -0.0003859996795654297, 0.00016248226165771484, 0.0007109642028808594, 0.001259446144104004, 0.0018079280853271484, 0.002356410026550293, 0.0029048919677734375, 0.003453373908996582, 0.0040018558502197266, 0.004550337791442871, 0.005098819732666016, 0.00564730167388916, 0.006195783615112305, 0.006744265556335449, 0.007292747497558594, 0.007841229438781738, 0.008389711380004883, 0.008938193321228027, 0.009486675262451172, 0.010035157203674316, 0.010583639144897461, 0.011132121086120605, 0.01168060302734375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 7.0, 1.0, 6.0, 8.0, 15.0, 21.0, 34.0, 56.0, 95.0, 144.0, 303.0, 532.0, 1022.0, 2276.0, 7146.0, 35732.0, 440979.0, 3525359.0, 153132.0, 19055.0, 4764.0, 1682.0, 841.0, 433.0, 251.0, 149.0, 75.0, 48.0, 33.0, 16.0, 12.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00896453857421875, -0.008695483207702637, -0.008426427841186523, -0.00815737247467041, -0.007888317108154297, -0.007619261741638184, -0.00735020637512207, -0.007081151008605957, -0.006812095642089844, -0.0065430402755737305, -0.006273984909057617, -0.006004929542541504, -0.005735874176025391, -0.005466818809509277, -0.005197763442993164, -0.004928708076477051, -0.0046596527099609375, -0.004390597343444824, -0.004121541976928711, -0.0038524866104125977, -0.0035834312438964844, -0.003314375877380371, -0.003045320510864258, -0.0027762651443481445, -0.0025072097778320312, -0.002238154411315918, -0.0019690990447998047, -0.0017000436782836914, -0.0014309883117675781, -0.0011619329452514648, -0.0008928775787353516, -0.0006238222122192383, -0.000354766845703125, -8.571147918701172e-05, 0.00018334388732910156, 0.00045239925384521484, 0.0007214546203613281, 0.0009905099868774414, 0.0012595653533935547, 0.001528620719909668, 0.0017976760864257812, 0.0020667314529418945, 0.002335786819458008, 0.002604842185974121, 0.0028738975524902344, 0.0031429529190063477, 0.003412008285522461, 0.0036810636520385742, 0.0039501190185546875, 0.004219174385070801, 0.004488229751586914, 0.004757285118103027, 0.005026340484619141, 0.005295395851135254, 0.005564451217651367, 0.0058335065841674805, 0.006102561950683594, 0.006371617317199707, 0.00664067268371582, 0.006909728050231934, 0.007178783416748047, 0.00744783878326416, 0.0077168941497802734, 0.007985949516296387, 0.0082550048828125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 2.0, 3.0, 10.0, 4.0, 10.0, 7.0, 24.0, 24.0, 46.0, 55.0, 109.0, 208.0, 491.0, 924.0, 1001.0, 442.0, 246.0, 151.0, 86.0, 74.0, 57.0, 31.0, 26.0, 15.0, 9.0, 7.0, 3.0, 0.0, 5.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00601959228515625, -0.0058190226554870605, -0.005618453025817871, -0.005417883396148682, -0.005217313766479492, -0.005016744136810303, -0.004816174507141113, -0.004615604877471924, -0.004415035247802734, -0.004214465618133545, -0.0040138959884643555, -0.003813326358795166, -0.0036127567291259766, -0.003412187099456787, -0.0032116174697875977, -0.003011047840118408, -0.0028104782104492188, -0.0026099085807800293, -0.00240933895111084, -0.0022087693214416504, -0.002008199691772461, -0.0018076300621032715, -0.001607060432434082, -0.0014064908027648926, -0.0012059211730957031, -0.0010053515434265137, -0.0008047819137573242, -0.0006042122840881348, -0.0004036426544189453, -0.00020307302474975586, -2.5033950805664062e-06, 0.00019806623458862305, 0.0003986358642578125, 0.000599205493927002, 0.0007997751235961914, 0.0010003447532653809, 0.0012009143829345703, 0.0014014840126037598, 0.0016020536422729492, 0.0018026232719421387, 0.002003192901611328, 0.0022037625312805176, 0.002404332160949707, 0.0026049017906188965, 0.002805471420288086, 0.0030060410499572754, 0.003206610679626465, 0.0034071803092956543, 0.0036077499389648438, 0.003808319568634033, 0.004008889198303223, 0.004209458827972412, 0.0044100284576416016, 0.004610598087310791, 0.0048111677169799805, 0.00501173734664917, 0.005212306976318359, 0.005412876605987549, 0.005613446235656738, 0.005814015865325928, 0.006014585494995117, 0.006215155124664307, 0.006415724754333496, 0.0066162943840026855, 0.006816864013671875]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 5.0, 22.0, 202.0, 498.0, 215.0, 42.0, 9.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1130090057849884, -0.1101374477148056, -0.1072658896446228, -0.10439433157444, -0.1015227735042572, -0.098651222884655, -0.0957796648144722, -0.0929081067442894, -0.0900365486741066, -0.0871649906039238, -0.084293432533741, -0.0814218744635582, -0.078550323843956, -0.0756787657737732, -0.0728072077035904, -0.06993564963340759, -0.06706409156322479, -0.06419253349304199, -0.06132097542285919, -0.05844942107796669, -0.05557786300778389, -0.05270630493760109, -0.04983475059270859, -0.04696319252252579, -0.04409163445234299, -0.04122007638216019, -0.038348518311977386, -0.035476963967084885, -0.032605405896902084, -0.029733847826719284, -0.026862291619181633, -0.023990735411643982, -0.02111917734146118, -0.01824761927127838, -0.01537606306374073, -0.012504505924880505, -0.009632948786020279, -0.006761391647160053, -0.0038898345082998276, -0.0010182783007621765, 0.0018532797694206238, 0.0047248369082808495, 0.007596394047141075, 0.0104679511860013, 0.013339508324861526, 0.016211066395044327, 0.019082622602581978, 0.02195417881011963, 0.02482573688030243, 0.02769729495048523, 0.03056885115802288, 0.03344040736556053, 0.03631196543574333, 0.03918352350592613, 0.042055077850818634, 0.044926635921001434, 0.047798193991184235, 0.050669752061367035, 0.053541310131549835, 0.05641286447644234, 0.05928442254662514, 0.06215598061680794, 0.06502753496170044, 0.06789909303188324, 0.07077065110206604]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 4.0, 7.0, 4.0, 10.0, 17.0, 10.0, 18.0, 20.0, 25.0, 40.0, 52.0, 48.0, 46.0, 69.0, 51.0, 56.0, 61.0, 76.0, 60.0, 48.0, 49.0, 36.0, 50.0, 33.0, 25.0, 20.0, 16.0, 9.0, 17.0, 9.0, 4.0, 3.0, 3.0, 8.0, 5.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.02691507339477539, -0.02626679465174675, -0.02561851590871811, -0.02497023716568947, -0.024321958422660828, -0.023673679679632187, -0.023025400936603546, -0.022377122193574905, -0.021728843450546265, -0.021080564707517624, -0.020432285964488983, -0.019784007221460342, -0.0191357284784317, -0.01848744973540306, -0.01783917099237442, -0.01719089224934578, -0.01654261350631714, -0.015894334763288498, -0.015246056020259857, -0.014597777277231216, -0.013949498534202576, -0.013301219791173935, -0.012652941048145294, -0.012004662305116653, -0.011356383562088013, -0.010708104819059372, -0.010059826076030731, -0.00941154733300209, -0.00876326858997345, -0.008114989846944809, -0.007466711103916168, -0.0068184323608875275, -0.006170153617858887, -0.005521874874830246, -0.004873596131801605, -0.0042253173887729645, -0.0035770386457443237, -0.002928759902715683, -0.0022804811596870422, -0.0016322024166584015, -0.0009839236736297607, -0.00033564493060112, 0.00031263381242752075, 0.0009609125554561615, 0.0016091912984848022, 0.002257470041513443, 0.0029057487845420837, 0.0035540275275707245, 0.004202306270599365, 0.004850585013628006, 0.005498863756656647, 0.0061471424996852875, 0.006795421242713928, 0.007443699985742569, 0.00809197872877121, 0.00874025747179985, 0.009388536214828491, 0.010036814957857132, 0.010685093700885773, 0.011333372443914413, 0.011981651186943054, 0.012629929929971695, 0.013278208673000336, 0.013926487416028976, 0.014574766159057617]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 6.0, 3.0, 11.0, 15.0, 18.0, 23.0, 31.0, 38.0, 54.0, 64.0, 111.0, 117.0, 218.0, 326.0, 517.0, 930.0, 2786.0, 46586.0, 930559.0, 60413.0, 3041.0, 1055.0, 542.0, 355.0, 207.0, 151.0, 99.0, 93.0, 51.0, 36.0, 26.0, 17.0, 10.0, 13.0, 9.0, 5.0, 3.0, 4.0, 1.0, 4.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0220794677734375, -0.021277427673339844, -0.020475387573242188, -0.01967334747314453, -0.018871307373046875, -0.01806926727294922, -0.017267227172851562, -0.016465187072753906, -0.01566314697265625, -0.014861106872558594, -0.014059066772460938, -0.013257026672363281, -0.012454986572265625, -0.011652946472167969, -0.010850906372070312, -0.010048866271972656, -0.009246826171875, -0.008444786071777344, -0.0076427459716796875, -0.006840705871582031, -0.006038665771484375, -0.005236625671386719, -0.0044345855712890625, -0.0036325454711914062, -0.00283050537109375, -0.0020284652709960938, -0.0012264251708984375, -0.00042438507080078125, 0.000377655029296875, 0.0011796951293945312, 0.0019817352294921875, 0.0027837753295898438, 0.0035858154296875, 0.004387855529785156, 0.0051898956298828125, 0.005991935729980469, 0.006793975830078125, 0.007596015930175781, 0.008398056030273438, 0.009200096130371094, 0.01000213623046875, 0.010804176330566406, 0.011606216430664062, 0.012408256530761719, 0.013210296630859375, 0.014012336730957031, 0.014814376831054688, 0.015616416931152344, 0.01641845703125, 0.017220497131347656, 0.018022537231445312, 0.01882457733154297, 0.019626617431640625, 0.02042865753173828, 0.021230697631835938, 0.022032737731933594, 0.02283477783203125, 0.023636817932128906, 0.024438858032226562, 0.02524089813232422, 0.026042938232421875, 0.02684497833251953, 0.027647018432617188, 0.028449058532714844, 0.0292510986328125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 77.0, 239.0, 368.0, 260.0, 46.0, 9.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022552490234375, -0.022008657455444336, -0.021464824676513672, -0.020920991897583008, -0.020377159118652344, -0.01983332633972168, -0.019289493560791016, -0.01874566078186035, -0.018201828002929688, -0.017657995223999023, -0.01711416244506836, -0.016570329666137695, -0.01602649688720703, -0.015482664108276367, -0.014938831329345703, -0.014394998550415039, -0.013851165771484375, -0.013307332992553711, -0.012763500213623047, -0.012219667434692383, -0.011675834655761719, -0.011132001876831055, -0.01058816909790039, -0.010044336318969727, -0.009500503540039062, -0.008956670761108398, -0.008412837982177734, -0.00786900520324707, -0.007325172424316406, -0.006781339645385742, -0.006237506866455078, -0.005693674087524414, -0.00514984130859375, -0.004606008529663086, -0.004062175750732422, -0.003518342971801758, -0.0029745101928710938, -0.0024306774139404297, -0.0018868446350097656, -0.0013430118560791016, -0.0007991790771484375, -0.00025534629821777344, 0.0002884864807128906, 0.0008323192596435547, 0.0013761520385742188, 0.0019199848175048828, 0.002463817596435547, 0.003007650375366211, 0.003551483154296875, 0.004095315933227539, 0.004639148712158203, 0.005182981491088867, 0.005726814270019531, 0.006270647048950195, 0.006814479827880859, 0.0073583126068115234, 0.007902145385742188, 0.008445978164672852, 0.008989810943603516, 0.00953364372253418, 0.010077476501464844, 0.010621309280395508, 0.011165142059326172, 0.011708974838256836, 0.0122528076171875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 9.0, 11.0, 14.0, 10.0, 18.0, 32.0, 47.0, 48.0, 79.0, 108.0, 150.0, 231.0, 391.0, 676.0, 1606.0, 5077.0, 22084.0, 132401.0, 542433.0, 283023.0, 46188.0, 9044.0, 2481.0, 988.0, 470.0, 285.0, 207.0, 123.0, 89.0, 60.0, 41.0, 39.0, 23.0, 16.0, 9.0, 8.0, 11.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0084686279296875, -0.008192896842956543, -0.007917165756225586, -0.007641434669494629, -0.007365703582763672, -0.007089972496032715, -0.006814241409301758, -0.006538510322570801, -0.006262779235839844, -0.005987048149108887, -0.00571131706237793, -0.005435585975646973, -0.005159854888916016, -0.004884123802185059, -0.0046083927154541016, -0.0043326616287231445, -0.0040569305419921875, -0.0037811994552612305, -0.0035054683685302734, -0.0032297372817993164, -0.0029540061950683594, -0.0026782751083374023, -0.0024025440216064453, -0.0021268129348754883, -0.0018510818481445312, -0.0015753507614135742, -0.0012996196746826172, -0.0010238885879516602, -0.0007481575012207031, -0.0004724264144897461, -0.00019669532775878906, 7.903575897216797e-05, 0.000354766845703125, 0.000630497932434082, 0.0009062290191650391, 0.001181960105895996, 0.0014576911926269531, 0.0017334222793579102, 0.002009153366088867, 0.0022848844528198242, 0.0025606155395507812, 0.0028363466262817383, 0.0031120777130126953, 0.0033878087997436523, 0.0036635398864746094, 0.003939270973205566, 0.0042150020599365234, 0.0044907331466674805, 0.0047664642333984375, 0.0050421953201293945, 0.0053179264068603516, 0.005593657493591309, 0.005869388580322266, 0.006145119667053223, 0.00642085075378418, 0.006696581840515137, 0.006972312927246094, 0.007248044013977051, 0.007523775100708008, 0.007799506187438965, 0.008075237274169922, 0.008350968360900879, 0.008626699447631836, 0.008902430534362793, 0.00917816162109375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 6.0, 3.0, 4.0, 5.0, 10.0, 9.0, 9.0, 16.0, 17.0, 22.0, 30.0, 18.0, 37.0, 34.0, 41.0, 45.0, 45.0, 49.0, 64.0, 45.0, 55.0, 51.0, 52.0, 44.0, 40.0, 37.0, 29.0, 39.0, 27.0, 17.0, 19.0, 17.0, 12.0, 13.0, 12.0, 5.0, 9.0, 6.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007137298583984375, -0.006920218467712402, -0.00670313835144043, -0.006486058235168457, -0.006268978118896484, -0.006051898002624512, -0.005834817886352539, -0.005617737770080566, -0.005400657653808594, -0.005183577537536621, -0.0049664974212646484, -0.004749417304992676, -0.004532337188720703, -0.0043152570724487305, -0.004098176956176758, -0.003881096839904785, -0.0036640167236328125, -0.00344693660736084, -0.003229856491088867, -0.0030127763748168945, -0.002795696258544922, -0.0025786161422729492, -0.0023615360260009766, -0.002144455909729004, -0.0019273757934570312, -0.0017102956771850586, -0.001493215560913086, -0.0012761354446411133, -0.0010590553283691406, -0.000841975212097168, -0.0006248950958251953, -0.00040781497955322266, -0.00019073486328125, 2.6345252990722656e-05, 0.0002434253692626953, 0.00046050548553466797, 0.0006775856018066406, 0.0008946657180786133, 0.001111745834350586, 0.0013288259506225586, 0.0015459060668945312, 0.001762986183166504, 0.0019800662994384766, 0.0021971464157104492, 0.002414226531982422, 0.0026313066482543945, 0.002848386764526367, 0.00306546688079834, 0.0032825469970703125, 0.003499627113342285, 0.003716707229614258, 0.0039337873458862305, 0.004150867462158203, 0.004367947578430176, 0.0045850276947021484, 0.004802107810974121, 0.005019187927246094, 0.005236268043518066, 0.005453348159790039, 0.005670428276062012, 0.005887508392333984, 0.006104588508605957, 0.00632166862487793, 0.006538748741149902, 0.006755828857421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 7.0, 10.0, 17.0, 25.0, 40.0, 68.0, 128.0, 247.0, 395.0, 788.0, 1643.0, 3703.0, 9061.0, 26078.0, 100400.0, 508473.0, 308045.0, 60009.0, 17421.0, 6587.0, 2760.0, 1294.0, 611.0, 297.0, 192.0, 105.0, 64.0, 19.0, 26.0, 10.0, 6.0, 8.0, 3.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.003997802734375, -0.0038830041885375977, -0.0037682056427001953, -0.003653407096862793, -0.0035386085510253906, -0.0034238100051879883, -0.003309011459350586, -0.0031942129135131836, -0.0030794143676757812, -0.002964615821838379, -0.0028498172760009766, -0.0027350187301635742, -0.002620220184326172, -0.0025054216384887695, -0.002390623092651367, -0.002275824546813965, -0.0021610260009765625, -0.00204622745513916, -0.0019314289093017578, -0.0018166303634643555, -0.0017018318176269531, -0.0015870332717895508, -0.0014722347259521484, -0.001357436180114746, -0.0012426376342773438, -0.0011278390884399414, -0.001013040542602539, -0.0008982419967651367, -0.0007834434509277344, -0.000668644905090332, -0.0005538463592529297, -0.00043904781341552734, -0.000324249267578125, -0.00020945072174072266, -9.465217590332031e-05, 2.014636993408203e-05, 0.00013494491577148438, 0.0002497434616088867, 0.00036454200744628906, 0.0004793405532836914, 0.0005941390991210938, 0.0007089376449584961, 0.0008237361907958984, 0.0009385347366333008, 0.0010533332824707031, 0.0011681318283081055, 0.0012829303741455078, 0.0013977289199829102, 0.0015125274658203125, 0.0016273260116577148, 0.0017421245574951172, 0.0018569231033325195, 0.001971721649169922, 0.0020865201950073242, 0.0022013187408447266, 0.002316117286682129, 0.0024309158325195312, 0.0025457143783569336, 0.002660512924194336, 0.0027753114700317383, 0.0028901100158691406, 0.003004908561706543, 0.0031197071075439453, 0.0032345056533813477, 0.00334930419921875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 4.0, 7.0, 9.0, 17.0, 4.0, 19.0, 25.0, 42.0, 57.0, 77.0, 85.0, 87.0, 80.0, 100.0, 93.0, 72.0, 64.0, 35.0, 28.0, 28.0, 17.0, 11.0, 10.0, 6.0, 5.0, 8.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00010597705841064453, -0.00010283943265676498, -9.970180690288544e-05, -9.656418114900589e-05, -9.342655539512634e-05, -9.02889296412468e-05, -8.715130388736725e-05, -8.40136781334877e-05, -8.087605237960815e-05, -7.773842662572861e-05, -7.460080087184906e-05, -7.146317511796951e-05, -6.832554936408997e-05, -6.518792361021042e-05, -6.205029785633087e-05, -5.8912672102451324e-05, -5.577504634857178e-05, -5.263742059469223e-05, -4.949979484081268e-05, -4.6362169086933136e-05, -4.322454333305359e-05, -4.008691757917404e-05, -3.6949291825294495e-05, -3.381166607141495e-05, -3.06740403175354e-05, -2.7536414563655853e-05, -2.4398788809776306e-05, -2.126116305589676e-05, -1.8123537302017212e-05, -1.4985911548137665e-05, -1.1848285794258118e-05, -8.71066004037857e-06, -5.5730342864990234e-06, -2.4354085326194763e-06, 7.022172212600708e-07, 3.839842975139618e-06, 6.977468729019165e-06, 1.0115094482898712e-05, 1.325272023677826e-05, 1.6390345990657806e-05, 1.9527971744537354e-05, 2.26655974984169e-05, 2.5803223252296448e-05, 2.8940849006175995e-05, 3.207847476005554e-05, 3.521610051393509e-05, 3.8353726267814636e-05, 4.149135202169418e-05, 4.462897777557373e-05, 4.776660352945328e-05, 5.0904229283332825e-05, 5.404185503721237e-05, 5.717948079109192e-05, 6.0317106544971466e-05, 6.345473229885101e-05, 6.659235805273056e-05, 6.972998380661011e-05, 7.286760956048965e-05, 7.60052353143692e-05, 7.914286106824875e-05, 8.22804868221283e-05, 8.541811257600784e-05, 8.855573832988739e-05, 9.169336408376694e-05, 9.483098983764648e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 4.0, 2.0, 5.0, 8.0, 11.0, 14.0, 23.0, 33.0, 56.0, 101.0, 213.0, 451.0, 1315.0, 5551.0, 34861.0, 575812.0, 396920.0, 26504.0, 4656.0, 1172.0, 388.0, 163.0, 108.0, 53.0, 38.0, 23.0, 23.0, 7.0, 8.0, 5.0, 3.0, 2.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00870513916015625, -0.008462905883789062, -0.008220672607421875, -0.007978439331054688, -0.0077362060546875, -0.0074939727783203125, -0.007251739501953125, -0.0070095062255859375, -0.00676727294921875, -0.0065250396728515625, -0.006282806396484375, -0.0060405731201171875, -0.00579833984375, -0.0055561065673828125, -0.005313873291015625, -0.0050716400146484375, -0.00482940673828125, -0.0045871734619140625, -0.004344940185546875, -0.0041027069091796875, -0.0038604736328125, -0.0036182403564453125, -0.003376007080078125, -0.0031337738037109375, -0.00289154052734375, -0.0026493072509765625, -0.002407073974609375, -0.0021648406982421875, -0.001922607421875, -0.0016803741455078125, -0.001438140869140625, -0.0011959075927734375, -0.00095367431640625, -0.0007114410400390625, -0.000469207763671875, -0.0002269744873046875, 1.52587890625e-05, 0.0002574920654296875, 0.000499725341796875, 0.0007419586181640625, 0.00098419189453125, 0.0012264251708984375, 0.001468658447265625, 0.0017108917236328125, 0.001953125, 0.0021953582763671875, 0.002437591552734375, 0.0026798248291015625, 0.00292205810546875, 0.0031642913818359375, 0.003406524658203125, 0.0036487579345703125, 0.0038909912109375, 0.0041332244873046875, 0.004375457763671875, 0.0046176910400390625, 0.00485992431640625, 0.0051021575927734375, 0.005344390869140625, 0.0055866241455078125, 0.005828857421875, 0.0060710906982421875, 0.006313323974609375, 0.0065555572509765625, 0.00679779052734375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 7.0, 8.0, 7.0, 11.0, 20.0, 19.0, 32.0, 52.0, 68.0, 89.0, 115.0, 118.0, 107.0, 91.0, 72.0, 48.0, 36.0, 22.0, 21.0, 8.0, 6.0, 17.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004444122314453125, -0.004278361797332764, -0.004112601280212402, -0.003946840763092041, -0.0037810802459716797, -0.0036153197288513184, -0.003449559211730957, -0.0032837986946105957, -0.0031180381774902344, -0.002952277660369873, -0.0027865171432495117, -0.0026207566261291504, -0.002454996109008789, -0.0022892355918884277, -0.0021234750747680664, -0.001957714557647705, -0.0017919540405273438, -0.0016261935234069824, -0.001460433006286621, -0.0012946724891662598, -0.0011289119720458984, -0.0009631514549255371, -0.0007973909378051758, -0.0006316304206848145, -0.0004658699035644531, -0.0003001093864440918, -0.00013434886932373047, 3.141164779663086e-05, 0.0001971721649169922, 0.0003629326820373535, 0.0005286931991577148, 0.0006944537162780762, 0.0008602142333984375, 0.0010259747505187988, 0.0011917352676391602, 0.0013574957847595215, 0.0015232563018798828, 0.0016890168190002441, 0.0018547773361206055, 0.002020537853240967, 0.002186298370361328, 0.0023520588874816895, 0.0025178194046020508, 0.002683579921722412, 0.0028493404388427734, 0.0030151009559631348, 0.003180861473083496, 0.0033466219902038574, 0.0035123825073242188, 0.00367814302444458, 0.0038439035415649414, 0.004009664058685303, 0.004175424575805664, 0.004341185092926025, 0.004506945610046387, 0.004672706127166748, 0.004838466644287109, 0.005004227161407471, 0.005169987678527832, 0.005335748195648193, 0.005501508712768555, 0.005667269229888916, 0.005833029747009277, 0.005998790264129639, 0.00616455078125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 10.0, 36.0, 242.0, 475.0, 192.0, 36.0, 9.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14934255182743073, -0.1461886465549469, -0.14303475618362427, -0.13988085091114044, -0.13672694563865662, -0.1335730403661728, -0.13041914999485016, -0.12726524472236633, -0.12411133944988251, -0.12095744162797928, -0.11780353635549545, -0.11464963853359222, -0.1114957332611084, -0.10834183543920517, -0.10518793016672134, -0.10203403234481812, -0.09888012707233429, -0.09572622925043106, -0.09257232397794724, -0.089418426156044, -0.08626452088356018, -0.08311062306165695, -0.07995671778917313, -0.0768028199672699, -0.07364892214536667, -0.07049502432346344, -0.06734111905097961, -0.06418722122907639, -0.06103331595659256, -0.05787941813468933, -0.054725512862205505, -0.05157161504030228, -0.04841770976781845, -0.045263808220624924, -0.042109906673431396, -0.03895600512623787, -0.03580210357904434, -0.03264820575714111, -0.029494302347302437, -0.02634040080010891, -0.023186499252915382, -0.020032597705721855, -0.016878696158528328, -0.013724795542657375, -0.010570893995463848, -0.0074169933795928955, -0.004263091832399368, -0.001109190285205841, 0.002044711261987686, 0.005198612809181213, 0.00835251435637474, 0.011506414972245693, 0.01466031651943922, 0.017814217135310173, 0.0209681186825037, 0.024122020229697227, 0.027275921776890755, 0.030429823324084282, 0.03358372300863266, 0.03673762455582619, 0.039891526103019714, 0.04304542765021324, 0.04619932919740677, 0.049353230744600296, 0.05250713229179382]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 6.0, 7.0, 4.0, 5.0, 5.0, 10.0, 11.0, 10.0, 7.0, 15.0, 17.0, 12.0, 17.0, 14.0, 32.0, 22.0, 26.0, 31.0, 24.0, 30.0, 36.0, 39.0, 35.0, 34.0, 41.0, 33.0, 44.0, 44.0, 26.0, 38.0, 33.0, 34.0, 29.0, 28.0, 35.0, 28.0, 19.0, 17.0, 15.0, 14.0, 13.0, 19.0, 8.0, 9.0, 7.0, 4.0, 6.0, 8.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015686094760894775, -0.015170760452747345, -0.014655426144599915, -0.014140091836452484, -0.013624757528305054, -0.013109423220157623, -0.012594088912010193, -0.012078754603862762, -0.011563420295715332, -0.011048085987567902, -0.010532751679420471, -0.01001741737127304, -0.00950208306312561, -0.00898674875497818, -0.00847141444683075, -0.007956080138683319, -0.007440745830535889, -0.006925411522388458, -0.006410077214241028, -0.005894742906093597, -0.005379408597946167, -0.004864074289798737, -0.004348739981651306, -0.0038334056735038757, -0.0033180713653564453, -0.002802737057209015, -0.0022874027490615845, -0.001772068440914154, -0.0012567341327667236, -0.0007413998246192932, -0.0002260655164718628, 0.0002892687916755676, 0.000804603099822998, 0.0013199374079704285, 0.0018352717161178589, 0.0023506060242652893, 0.0028659403324127197, 0.00338127464056015, 0.0038966089487075806, 0.004411943256855011, 0.004927277565002441, 0.005442611873149872, 0.005957946181297302, 0.006473280489444733, 0.006988614797592163, 0.0075039491057395935, 0.008019283413887024, 0.008534617722034454, 0.009049952030181885, 0.009565286338329315, 0.010080620646476746, 0.010595954954624176, 0.011111289262771606, 0.011626623570919037, 0.012141957879066467, 0.012657292187213898, 0.013172626495361328, 0.013687960803508759, 0.014203295111656189, 0.01471862941980362, 0.01523396372795105, 0.01574929803609848, 0.01626463234424591, 0.01677996665239334, 0.01729530096054077]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 6.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 15.0, 13.0, 13.0, 11.0, 14.0, 21.0, 22.0, 29.0, 31.0, 48.0, 67.0, 111.0, 139.0, 215.0, 334.0, 1424.0, 9056.0, 2571804.0, 1599441.0, 7855.0, 1774.0, 976.0, 492.0, 142.0, 61.0, 42.0, 33.0, 16.0, 23.0, 9.0, 6.0, 1.0, 3.0, 7.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0], "bins": [-0.0273590087890625, -0.02663874626159668, -0.02591848373413086, -0.02519822120666504, -0.02447795867919922, -0.0237576961517334, -0.023037433624267578, -0.022317171096801758, -0.021596908569335938, -0.020876646041870117, -0.020156383514404297, -0.019436120986938477, -0.018715858459472656, -0.017995595932006836, -0.017275333404541016, -0.016555070877075195, -0.015834808349609375, -0.015114545822143555, -0.014394283294677734, -0.013674020767211914, -0.012953758239746094, -0.012233495712280273, -0.011513233184814453, -0.010792970657348633, -0.010072708129882812, -0.009352445602416992, -0.008632183074951172, -0.007911920547485352, -0.007191658020019531, -0.006471395492553711, -0.005751132965087891, -0.00503087043762207, -0.00431060791015625, -0.0035903453826904297, -0.0028700828552246094, -0.002149820327758789, -0.0014295578002929688, -0.0007092952728271484, 1.0967254638671875e-05, 0.0007312297821044922, 0.0014514923095703125, 0.002171754837036133, 0.002892017364501953, 0.0036122798919677734, 0.004332542419433594, 0.005052804946899414, 0.005773067474365234, 0.006493330001831055, 0.007213592529296875, 0.007933855056762695, 0.008654117584228516, 0.009374380111694336, 0.010094642639160156, 0.010814905166625977, 0.011535167694091797, 0.012255430221557617, 0.012975692749023438, 0.013695955276489258, 0.014416217803955078, 0.015136480331420898, 0.01585674285888672, 0.01657700538635254, 0.01729726791381836, 0.01801753044128418, 0.01873779296875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 45.0, 174.0, 339.0, 338.0, 91.0, 15.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.02313232421875, -0.022591829299926758, -0.022051334381103516, -0.021510839462280273, -0.02097034454345703, -0.02042984962463379, -0.019889354705810547, -0.019348859786987305, -0.018808364868164062, -0.01826786994934082, -0.017727375030517578, -0.017186880111694336, -0.016646385192871094, -0.01610589027404785, -0.01556539535522461, -0.015024900436401367, -0.014484405517578125, -0.013943910598754883, -0.01340341567993164, -0.012862920761108398, -0.012322425842285156, -0.011781930923461914, -0.011241436004638672, -0.01070094108581543, -0.010160446166992188, -0.009619951248168945, -0.009079456329345703, -0.008538961410522461, -0.007998466491699219, -0.0074579715728759766, -0.006917476654052734, -0.006376981735229492, -0.00583648681640625, -0.005295991897583008, -0.004755496978759766, -0.0042150020599365234, -0.0036745071411132812, -0.003134012222290039, -0.002593517303466797, -0.0020530223846435547, -0.0015125274658203125, -0.0009720325469970703, -0.0004315376281738281, 0.00010895729064941406, 0.0006494522094726562, 0.0011899471282958984, 0.0017304420471191406, 0.002270936965942383, 0.002811431884765625, 0.003351926803588867, 0.0038924217224121094, 0.0044329166412353516, 0.004973411560058594, 0.005513906478881836, 0.006054401397705078, 0.00659489631652832, 0.0071353912353515625, 0.007675886154174805, 0.008216381072998047, 0.008756875991821289, 0.009297370910644531, 0.009837865829467773, 0.010378360748291016, 0.010918855667114258, 0.0114593505859375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 4.0, 11.0, 17.0, 23.0, 36.0, 56.0, 113.0, 198.0, 442.0, 1076.0, 3259.0, 16633.0, 243524.0, 3805792.0, 108028.0, 10823.0, 2507.0, 947.0, 379.0, 181.0, 87.0, 57.0, 30.0, 19.0, 14.0, 10.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.01293182373046875, -0.01262664794921875, -0.01232147216796875, -0.01201629638671875, -0.01171112060546875, -0.01140594482421875, -0.01110076904296875, -0.01079559326171875, -0.01049041748046875, -0.01018524169921875, -0.00988006591796875, -0.00957489013671875, -0.00926971435546875, -0.00896453857421875, -0.00865936279296875, -0.00835418701171875, -0.00804901123046875, -0.00774383544921875, -0.00743865966796875, -0.00713348388671875, -0.00682830810546875, -0.00652313232421875, -0.00621795654296875, -0.00591278076171875, -0.00560760498046875, -0.00530242919921875, -0.00499725341796875, -0.00469207763671875, -0.00438690185546875, -0.00408172607421875, -0.00377655029296875, -0.00347137451171875, -0.00316619873046875, -0.00286102294921875, -0.00255584716796875, -0.00225067138671875, -0.00194549560546875, -0.00164031982421875, -0.00133514404296875, -0.00102996826171875, -0.00072479248046875, -0.00041961669921875, -0.00011444091796875, 0.00019073486328125, 0.00049591064453125, 0.00080108642578125, 0.00110626220703125, 0.00141143798828125, 0.00171661376953125, 0.00202178955078125, 0.00232696533203125, 0.00263214111328125, 0.00293731689453125, 0.00324249267578125, 0.00354766845703125, 0.00385284423828125, 0.00415802001953125, 0.00446319580078125, 0.00476837158203125, 0.00507354736328125, 0.00537872314453125, 0.00568389892578125, 0.00598907470703125, 0.00629425048828125, 0.00659942626953125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0, 5.0, 2.0, 1.0, 7.0, 3.0, 5.0, 10.0, 16.0, 36.0, 57.0, 73.0, 112.0, 222.0, 501.0, 1073.0, 924.0, 436.0, 180.0, 116.0, 77.0, 67.0, 47.0, 30.0, 17.0, 9.0, 11.0, 11.0, 5.0, 6.0, 1.0, 3.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003894805908203125, -0.0037445425987243652, -0.0035942792892456055, -0.0034440159797668457, -0.003293752670288086, -0.003143489360809326, -0.0029932260513305664, -0.0028429627418518066, -0.002692699432373047, -0.002542436122894287, -0.0023921728134155273, -0.0022419095039367676, -0.002091646194458008, -0.001941382884979248, -0.0017911195755004883, -0.0016408562660217285, -0.0014905929565429688, -0.001340329647064209, -0.0011900663375854492, -0.0010398030281066895, -0.0008895397186279297, -0.0007392764091491699, -0.0005890130996704102, -0.0004387497901916504, -0.0002884864807128906, -0.00013822317123413086, 1.2040138244628906e-05, 0.00016230344772338867, 0.00031256675720214844, 0.0004628300666809082, 0.000613093376159668, 0.0007633566856384277, 0.0009136199951171875, 0.0010638833045959473, 0.001214146614074707, 0.0013644099235534668, 0.0015146732330322266, 0.0016649365425109863, 0.001815199851989746, 0.001965463161468506, 0.0021157264709472656, 0.0022659897804260254, 0.002416253089904785, 0.002566516399383545, 0.0027167797088623047, 0.0028670430183410645, 0.0030173063278198242, 0.003167569637298584, 0.0033178329467773438, 0.0034680962562561035, 0.0036183595657348633, 0.003768622875213623, 0.003918886184692383, 0.004069149494171143, 0.004219412803649902, 0.004369676113128662, 0.004519939422607422, 0.004670202732086182, 0.004820466041564941, 0.004970729351043701, 0.005120992660522461, 0.005271255970001221, 0.0054215192794799805, 0.00557178258895874, 0.0057220458984375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 19.0, 130.0, 412.0, 307.0, 82.0, 34.0, 10.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04663003981113434, -0.04481848329305649, -0.043006930500268936, -0.041195373982191086, -0.039383821189403534, -0.037572264671325684, -0.03576070815324783, -0.03394915163516998, -0.03213759884238243, -0.03032604418694973, -0.02851448953151703, -0.02670293301343918, -0.024891378358006477, -0.023079823702573776, -0.021268267184495926, -0.019456712529063225, -0.017645157873630524, -0.015833603218197823, -0.014022047631442547, -0.012210492044687271, -0.01039893738925457, -0.008587382733821869, -0.006775827147066593, -0.0049642715603113174, -0.0031527169048786163, -0.001341161783784628, 0.0004703933373093605, 0.002281948458403349, 0.004093503579497337, 0.0059050582349300385, 0.007716613821685314, 0.00952816940844059, 0.011339724063873291, 0.013151278719305992, 0.014962834306061268, 0.016774389892816544, 0.018585944548249245, 0.020397499203681946, 0.022209055721759796, 0.024020610377192497, 0.0258321650326252, 0.0276437196880579, 0.0294552743434906, 0.03126683086156845, 0.0330783873796463, 0.03488994017243385, 0.036701496690511703, 0.038513049483299255, 0.040324606001377106, 0.042136162519454956, 0.04394771531224251, 0.04575927183032036, 0.04757082462310791, 0.04938238114118576, 0.05119393765926361, 0.05300549417734146, 0.05481704697012901, 0.05662860348820686, 0.058440156280994415, 0.060251712799072266, 0.062063269317150116, 0.06387482583522797, 0.06568637490272522, 0.06749793142080307, 0.06930948793888092]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 5.0, 12.0, 18.0, 20.0, 25.0, 28.0, 45.0, 54.0, 75.0, 89.0, 74.0, 87.0, 74.0, 74.0, 66.0, 55.0, 69.0, 40.0, 35.0, 27.0, 16.0, 15.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.026328742504119873, -0.02565111592411995, -0.024973489344120026, -0.024295862764120102, -0.023618236184120178, -0.022940609604120255, -0.02226298302412033, -0.021585356444120407, -0.020907729864120483, -0.02023010328412056, -0.019552476704120636, -0.018874850124120712, -0.01819722354412079, -0.017519596964120865, -0.01684197038412094, -0.016164343804121017, -0.015486717224121094, -0.01480909064412117, -0.014131464064121246, -0.013453837484121323, -0.012776210904121399, -0.012098584324121475, -0.011420957744121552, -0.010743331164121628, -0.010065704584121704, -0.00938807800412178, -0.008710451424121857, -0.008032824844121933, -0.007355198264122009, -0.006677571684122086, -0.005999945104122162, -0.005322318524122238, -0.0046446919441223145, -0.003967065364122391, -0.003289438784122467, -0.0026118122041225433, -0.0019341856241226196, -0.001256559044122696, -0.0005789324641227722, 9.869411587715149e-05, 0.0007763206958770752, 0.001453947275876999, 0.0021315738558769226, 0.0028092004358768463, 0.00348682701587677, 0.004164453595876694, 0.004842080175876617, 0.005519706755876541, 0.006197333335876465, 0.0068749599158763885, 0.007552586495876312, 0.008230213075876236, 0.00890783965587616, 0.009585466235876083, 0.010263092815876007, 0.01094071939587593, 0.011618345975875854, 0.012295972555875778, 0.012973599135875702, 0.013651225715875626, 0.01432885229587555, 0.015006478875875473, 0.015684105455875397, 0.01636173203587532, 0.017039358615875244]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 6.0, 9.0, 16.0, 10.0, 21.0, 22.0, 30.0, 43.0, 59.0, 105.0, 127.0, 221.0, 302.0, 514.0, 918.0, 2758.0, 47026.0, 944146.0, 47177.0, 2655.0, 951.0, 490.0, 319.0, 187.0, 125.0, 80.0, 52.0, 52.0, 30.0, 24.0, 20.0, 14.0, 12.0, 9.0, 4.0, 5.0, 1.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0186004638671875, -0.017924070358276367, -0.017247676849365234, -0.0165712833404541, -0.01589488983154297, -0.015218496322631836, -0.014542102813720703, -0.01386570930480957, -0.013189315795898438, -0.012512922286987305, -0.011836528778076172, -0.011160135269165039, -0.010483741760253906, -0.009807348251342773, -0.00913095474243164, -0.008454561233520508, -0.007778167724609375, -0.007101774215698242, -0.006425380706787109, -0.0057489871978759766, -0.005072593688964844, -0.004396200180053711, -0.003719806671142578, -0.0030434131622314453, -0.0023670196533203125, -0.0016906261444091797, -0.0010142326354980469, -0.00033783912658691406, 0.00033855438232421875, 0.0010149478912353516, 0.0016913414001464844, 0.002367734909057617, 0.00304412841796875, 0.003720521926879883, 0.004396915435791016, 0.0050733089447021484, 0.005749702453613281, 0.006426095962524414, 0.007102489471435547, 0.00777888298034668, 0.008455276489257812, 0.009131669998168945, 0.009808063507080078, 0.010484457015991211, 0.011160850524902344, 0.011837244033813477, 0.01251363754272461, 0.013190031051635742, 0.013866424560546875, 0.014542818069458008, 0.01521921157836914, 0.015895605087280273, 0.016571998596191406, 0.01724839210510254, 0.017924785614013672, 0.018601179122924805, 0.019277572631835938, 0.01995396614074707, 0.020630359649658203, 0.021306753158569336, 0.02198314666748047, 0.0226595401763916, 0.023335933685302734, 0.024012327194213867, 0.024688720703125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 45.0, 195.0, 352.0, 322.0, 72.0, 16.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0227813720703125, -0.02223527431488037, -0.021689176559448242, -0.021143078804016113, -0.020596981048583984, -0.020050883293151855, -0.019504785537719727, -0.018958687782287598, -0.01841259002685547, -0.01786649227142334, -0.01732039451599121, -0.016774296760559082, -0.016228199005126953, -0.015682101249694824, -0.015136003494262695, -0.014589905738830566, -0.014043807983398438, -0.013497710227966309, -0.01295161247253418, -0.01240551471710205, -0.011859416961669922, -0.011313319206237793, -0.010767221450805664, -0.010221123695373535, -0.009675025939941406, -0.009128928184509277, -0.008582830429077148, -0.00803673267364502, -0.007490634918212891, -0.006944537162780762, -0.006398439407348633, -0.005852341651916504, -0.005306243896484375, -0.004760146141052246, -0.004214048385620117, -0.0036679506301879883, -0.0031218528747558594, -0.0025757551193237305, -0.0020296573638916016, -0.0014835596084594727, -0.0009374618530273438, -0.00039136409759521484, 0.00015473365783691406, 0.000700831413269043, 0.0012469291687011719, 0.0017930269241333008, 0.0023391246795654297, 0.0028852224349975586, 0.0034313201904296875, 0.003977417945861816, 0.004523515701293945, 0.005069613456726074, 0.005615711212158203, 0.006161808967590332, 0.006707906723022461, 0.00725400447845459, 0.007800102233886719, 0.008346199989318848, 0.008892297744750977, 0.009438395500183105, 0.009984493255615234, 0.010530591011047363, 0.011076688766479492, 0.011622786521911621, 0.01216888427734375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 8.0, 4.0, 6.0, 8.0, 16.0, 12.0, 15.0, 25.0, 21.0, 33.0, 44.0, 46.0, 86.0, 93.0, 164.0, 215.0, 353.0, 773.0, 2332.0, 9126.0, 48635.0, 279576.0, 533712.0, 141155.0, 24027.0, 5160.0, 1429.0, 542.0, 310.0, 174.0, 125.0, 65.0, 60.0, 43.0, 36.0, 29.0, 19.0, 17.0, 17.0, 10.0, 10.0, 6.0, 3.0, 8.0, 4.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007244110107421875, -0.007026553153991699, -0.0068089962005615234, -0.006591439247131348, -0.006373882293701172, -0.006156325340270996, -0.00593876838684082, -0.0057212114334106445, -0.005503654479980469, -0.005286097526550293, -0.005068540573120117, -0.004850983619689941, -0.004633426666259766, -0.00441586971282959, -0.004198312759399414, -0.003980755805969238, -0.0037631988525390625, -0.0035456418991088867, -0.003328084945678711, -0.003110527992248535, -0.0028929710388183594, -0.0026754140853881836, -0.002457857131958008, -0.002240300178527832, -0.0020227432250976562, -0.0018051862716674805, -0.0015876293182373047, -0.001370072364807129, -0.0011525154113769531, -0.0009349584579467773, -0.0007174015045166016, -0.0004998445510864258, -0.00028228759765625, -6.473064422607422e-05, 0.00015282630920410156, 0.00037038326263427734, 0.0005879402160644531, 0.0008054971694946289, 0.0010230541229248047, 0.0012406110763549805, 0.0014581680297851562, 0.001675724983215332, 0.0018932819366455078, 0.0021108388900756836, 0.0023283958435058594, 0.002545952796936035, 0.002763509750366211, 0.0029810667037963867, 0.0031986236572265625, 0.0034161806106567383, 0.003633737564086914, 0.00385129451751709, 0.004068851470947266, 0.004286408424377441, 0.004503965377807617, 0.004721522331237793, 0.004939079284667969, 0.0051566362380981445, 0.00537419319152832, 0.005591750144958496, 0.005809307098388672, 0.006026864051818848, 0.0062444210052490234, 0.006461977958679199, 0.006679534912109375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 5.0, 4.0, 12.0, 10.0, 10.0, 13.0, 9.0, 20.0, 15.0, 30.0, 24.0, 19.0, 27.0, 25.0, 37.0, 36.0, 47.0, 38.0, 46.0, 46.0, 41.0, 49.0, 41.0, 46.0, 37.0, 36.0, 35.0, 36.0, 38.0, 29.0, 15.0, 27.0, 14.0, 21.0, 13.0, 15.0, 10.0, 5.0, 7.0, 2.0, 2.0, 6.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005092620849609375, -0.00492250919342041, -0.004752397537231445, -0.0045822858810424805, -0.004412174224853516, -0.004242062568664551, -0.004071950912475586, -0.003901839256286621, -0.0037317276000976562, -0.0035616159439086914, -0.0033915042877197266, -0.0032213926315307617, -0.003051280975341797, -0.002881169319152832, -0.002711057662963867, -0.0025409460067749023, -0.0023708343505859375, -0.0022007226943969727, -0.002030611038208008, -0.001860499382019043, -0.0016903877258300781, -0.0015202760696411133, -0.0013501644134521484, -0.0011800527572631836, -0.0010099411010742188, -0.0008398294448852539, -0.0006697177886962891, -0.0004996061325073242, -0.0003294944763183594, -0.00015938282012939453, 1.0728836059570312e-05, 0.00018084049224853516, 0.0003509521484375, 0.0005210638046264648, 0.0006911754608154297, 0.0008612871170043945, 0.0010313987731933594, 0.0012015104293823242, 0.001371622085571289, 0.001541733741760254, 0.0017118453979492188, 0.0018819570541381836, 0.0020520687103271484, 0.0022221803665161133, 0.002392292022705078, 0.002562403678894043, 0.002732515335083008, 0.0029026269912719727, 0.0030727386474609375, 0.0032428503036499023, 0.003412961959838867, 0.003583073616027832, 0.003753185272216797, 0.003923296928405762, 0.0040934085845947266, 0.004263520240783691, 0.004433631896972656, 0.004603743553161621, 0.004773855209350586, 0.004943966865539551, 0.005114078521728516, 0.0052841901779174805, 0.005454301834106445, 0.00562441349029541, 0.005794525146484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 6.0, 7.0, 16.0, 14.0, 22.0, 32.0, 41.0, 41.0, 68.0, 107.0, 141.0, 210.0, 277.0, 422.0, 635.0, 929.0, 1347.0, 2179.0, 3582.0, 5966.0, 10430.0, 19969.0, 39119.0, 83860.0, 199422.0, 340674.0, 182041.0, 77403.0, 36101.0, 18268.0, 9938.0, 5686.0, 3384.0, 2100.0, 1288.0, 914.0, 561.0, 412.0, 255.0, 181.0, 145.0, 100.0, 73.0, 64.0, 39.0, 22.0, 14.0, 14.0, 16.0, 3.0, 4.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0], "bins": [-0.0013132095336914062, -0.001272737979888916, -0.0012322664260864258, -0.0011917948722839355, -0.0011513233184814453, -0.001110851764678955, -0.0010703802108764648, -0.0010299086570739746, -0.0009894371032714844, -0.0009489655494689941, -0.0009084939956665039, -0.0008680224418640137, -0.0008275508880615234, -0.0007870793342590332, -0.000746607780456543, -0.0007061362266540527, -0.0006656646728515625, -0.0006251931190490723, -0.000584721565246582, -0.0005442500114440918, -0.0005037784576416016, -0.00046330690383911133, -0.0004228353500366211, -0.00038236379623413086, -0.0003418922424316406, -0.0003014206886291504, -0.00026094913482666016, -0.00022047758102416992, -0.0001800060272216797, -0.00013953447341918945, -9.906291961669922e-05, -5.8591365814208984e-05, -1.811981201171875e-05, 2.2351741790771484e-05, 6.282329559326172e-05, 0.00010329484939575195, 0.0001437664031982422, 0.00018423795700073242, 0.00022470951080322266, 0.0002651810646057129, 0.0003056526184082031, 0.00034612417221069336, 0.0003865957260131836, 0.00042706727981567383, 0.00046753883361816406, 0.0005080103874206543, 0.0005484819412231445, 0.0005889534950256348, 0.000629425048828125, 0.0006698966026306152, 0.0007103681564331055, 0.0007508397102355957, 0.0007913112640380859, 0.0008317828178405762, 0.0008722543716430664, 0.0009127259254455566, 0.0009531974792480469, 0.0009936690330505371, 0.0010341405868530273, 0.0010746121406555176, 0.0011150836944580078, 0.001155555248260498, 0.0011960268020629883, 0.0012364983558654785, 0.0012769699096679688]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 9.0, 14.0, 26.0, 31.0, 50.0, 99.0, 134.0, 170.0, 165.0, 109.0, 66.0, 42.0, 31.0, 19.0, 8.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001671314239501953, -0.00016216188669204712, -0.00015719234943389893, -0.00015222281217575073, -0.00014725327491760254, -0.00014228373765945435, -0.00013731420040130615, -0.00013234466314315796, -0.00012737512588500977, -0.00012240558862686157, -0.00011743605136871338, -0.00011246651411056519, -0.00010749697685241699, -0.0001025274395942688, -9.75579023361206e-05, -9.258836507797241e-05, -8.761882781982422e-05, -8.264929056167603e-05, -7.767975330352783e-05, -7.271021604537964e-05, -6.774067878723145e-05, -6.277114152908325e-05, -5.780160427093506e-05, -5.2832067012786865e-05, -4.786252975463867e-05, -4.289299249649048e-05, -3.7923455238342285e-05, -3.295391798019409e-05, -2.79843807220459e-05, -2.3014843463897705e-05, -1.8045306205749512e-05, -1.3075768947601318e-05, -8.106231689453125e-06, -3.1366944313049316e-06, 1.8328428268432617e-06, 6.802380084991455e-06, 1.1771917343139648e-05, 1.6741454601287842e-05, 2.1710991859436035e-05, 2.668052911758423e-05, 3.165006637573242e-05, 3.6619603633880615e-05, 4.158914089202881e-05, 4.6558678150177e-05, 5.1528215408325195e-05, 5.649775266647339e-05, 6.146728992462158e-05, 6.643682718276978e-05, 7.140636444091797e-05, 7.637590169906616e-05, 8.134543895721436e-05, 8.631497621536255e-05, 9.128451347351074e-05, 9.625405073165894e-05, 0.00010122358798980713, 0.00010619312524795532, 0.00011116266250610352, 0.00011613219976425171, 0.0001211017370223999, 0.0001260712742805481, 0.0001310408115386963, 0.00013601034879684448, 0.00014097988605499268, 0.00014594942331314087, 0.00015091896057128906]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 8.0, 11.0, 9.0, 23.0, 36.0, 45.0, 67.0, 113.0, 168.0, 385.0, 687.0, 1662.0, 4026.0, 12706.0, 51703.0, 404945.0, 489941.0, 60117.0, 14084.0, 4390.0, 1761.0, 763.0, 364.0, 212.0, 123.0, 63.0, 54.0, 21.0, 20.0, 12.0, 11.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029430389404296875, -0.002825528383255005, -0.0027080178260803223, -0.0025905072689056396, -0.002472996711730957, -0.0023554861545562744, -0.002237975597381592, -0.002120465040206909, -0.0020029544830322266, -0.001885443925857544, -0.0017679333686828613, -0.0016504228115081787, -0.001532912254333496, -0.0014154016971588135, -0.0012978911399841309, -0.0011803805828094482, -0.0010628700256347656, -0.000945359468460083, -0.0008278489112854004, -0.0007103383541107178, -0.0005928277969360352, -0.00047531723976135254, -0.0003578066825866699, -0.0002402961254119873, -0.0001227855682373047, -5.27501106262207e-06, 0.00011223554611206055, 0.00022974610328674316, 0.0003472566604614258, 0.0004647672176361084, 0.000582277774810791, 0.0006997883319854736, 0.0008172988891601562, 0.0009348094463348389, 0.0010523200035095215, 0.001169830560684204, 0.0012873411178588867, 0.0014048516750335693, 0.001522362232208252, 0.0016398727893829346, 0.0017573833465576172, 0.0018748939037322998, 0.0019924044609069824, 0.002109915018081665, 0.0022274255752563477, 0.0023449361324310303, 0.002462446689605713, 0.0025799572467803955, 0.002697467803955078, 0.0028149783611297607, 0.0029324889183044434, 0.003049999475479126, 0.0031675100326538086, 0.003285020589828491, 0.003402531147003174, 0.0035200417041778564, 0.003637552261352539, 0.0037550628185272217, 0.0038725733757019043, 0.003990083932876587, 0.0041075944900512695, 0.004225105047225952, 0.004342615604400635, 0.004460126161575317, 0.00457763671875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 4.0, 7.0, 6.0, 10.0, 21.0, 18.0, 22.0, 46.0, 49.0, 94.0, 124.0, 125.0, 105.0, 94.0, 77.0, 52.0, 41.0, 29.0, 15.0, 13.0, 15.0, 11.0, 9.0, 7.0, 1.0, 4.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003387451171875, -0.003295302391052246, -0.003203153610229492, -0.0031110048294067383, -0.0030188560485839844, -0.0029267072677612305, -0.0028345584869384766, -0.0027424097061157227, -0.0026502609252929688, -0.002558112144470215, -0.002465963363647461, -0.002373814582824707, -0.002281665802001953, -0.0021895170211791992, -0.0020973682403564453, -0.0020052194595336914, -0.0019130706787109375, -0.0018209218978881836, -0.0017287731170654297, -0.0016366243362426758, -0.0015444755554199219, -0.001452326774597168, -0.001360177993774414, -0.0012680292129516602, -0.0011758804321289062, -0.0010837316513061523, -0.0009915828704833984, -0.0008994340896606445, -0.0008072853088378906, -0.0007151365280151367, -0.0006229877471923828, -0.0005308389663696289, -0.000438690185546875, -0.0003465414047241211, -0.0002543926239013672, -0.00016224384307861328, -7.009506225585938e-05, 2.205371856689453e-05, 0.00011420249938964844, 0.00020635128021240234, 0.00029850006103515625, 0.00039064884185791016, 0.00048279762268066406, 0.000574946403503418, 0.0006670951843261719, 0.0007592439651489258, 0.0008513927459716797, 0.0009435415267944336, 0.0010356903076171875, 0.0011278390884399414, 0.0012199878692626953, 0.0013121366500854492, 0.0014042854309082031, 0.001496434211730957, 0.001588582992553711, 0.0016807317733764648, 0.0017728805541992188, 0.0018650293350219727, 0.0019571781158447266, 0.0020493268966674805, 0.0021414756774902344, 0.0022336244583129883, 0.002325773239135742, 0.002417922019958496, 0.00251007080078125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 15.0, 950.0, 50.0, 4.0], "bins": [-0.5758289694786072, -0.5664706826210022, -0.5571123957633972, -0.5477541089057922, -0.538395881652832, -0.529037594795227, -0.5196793079376221, -0.5103210210800171, -0.5009627342224121, -0.49160444736480713, -0.48224619030952454, -0.47288790345191956, -0.4635296165943146, -0.4541713297367096, -0.444813072681427, -0.435454785823822, -0.42609649896621704, -0.41673821210861206, -0.40737995505332947, -0.3980216681957245, -0.3886633813381195, -0.3793050944805145, -0.36994683742523193, -0.36058855056762695, -0.35123029351234436, -0.3418720066547394, -0.3325137495994568, -0.3231554627418518, -0.3137971758842468, -0.30443888902664185, -0.29508063197135925, -0.2857223451137543, -0.2763640582561493, -0.2670057713985443, -0.2576475143432617, -0.24828922748565674, -0.23893094062805176, -0.22957266867160797, -0.22021439671516418, -0.2108561098575592, -0.20149783790111542, -0.19213956594467163, -0.18278127908706665, -0.17342300713062286, -0.16406472027301788, -0.1547064483165741, -0.14534816145896912, -0.13598988950252533, -0.12663160264492035, -0.11727332323789597, -0.10791504383087158, -0.0985567718744278, -0.08919848501682281, -0.07984021306037903, -0.07048193365335464, -0.06112365424633026, -0.051765378564596176, -0.04240709915757179, -0.03304882347583771, -0.023690544068813324, -0.01433226466178894, -0.004973985254764557, 0.004384290426969528, 0.013742569833993912, 0.023100849241018295]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 6.0, 11.0, 12.0, 13.0, 17.0, 18.0, 22.0, 23.0, 36.0, 38.0, 35.0, 44.0, 52.0, 48.0, 50.0, 38.0, 46.0, 46.0, 59.0, 54.0, 44.0, 39.0, 41.0, 38.0, 35.0, 20.0, 24.0, 15.0, 15.0, 17.0, 14.0, 6.0, 8.0, 4.0, 1.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01751530170440674, -0.01694650948047638, -0.01637771539390087, -0.015808921307325363, -0.015240129083395004, -0.01467133592814207, -0.014102542772889137, -0.013533749617636204, -0.01296495646238327, -0.012396163307130337, -0.011827370151877403, -0.01125857699662447, -0.010689783841371536, -0.010120990686118603, -0.00955219753086567, -0.008983404375612736, -0.008414611220359802, -0.007845818065106869, -0.007277024909853935, -0.006708231754601002, -0.006139438599348068, -0.005570645444095135, -0.005001852288842201, -0.004433059133589268, -0.0038642659783363342, -0.0032954728230834007, -0.0027266796678304672, -0.0021578865125775337, -0.0015890933573246002, -0.0010203002020716667, -0.0004515070468187332, 0.00011728610843420029, 0.0006860792636871338, 0.0012548724189400673, 0.0018236655741930008, 0.0023924587294459343, 0.002961251884698868, 0.0035300450399518013, 0.004098838195204735, 0.004667631350457668, 0.005236424505710602, 0.005805217660963535, 0.006374010816216469, 0.006942803971469402, 0.007511597126722336, 0.00808039028197527, 0.008649183437228203, 0.009217976592481136, 0.00978676974773407, 0.010355562902987003, 0.010924356058239937, 0.01149314921349287, 0.012061942368745804, 0.012630735523998737, 0.01319952867925167, 0.013768321834504604, 0.014337114989757538, 0.014905908145010471, 0.015474701300263405, 0.016043495386838913, 0.016612287610769272, 0.01718107983469963, 0.01774987392127514, 0.018318668007850647, 0.018887460231781006]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 4.0, 4.0, 5.0, 8.0, 6.0, 12.0, 12.0, 21.0, 22.0, 30.0, 55.0, 64.0, 107.0, 181.0, 470.0, 5237.0, 3882683.0, 300423.0, 3313.0, 992.0, 415.0, 92.0, 36.0, 21.0, 23.0, 10.0, 8.0, 5.0, 5.0, 8.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03399658203125, -0.03312277793884277, -0.03224897384643555, -0.03137516975402832, -0.030501365661621094, -0.029627561569213867, -0.02875375747680664, -0.027879953384399414, -0.027006149291992188, -0.02613234519958496, -0.025258541107177734, -0.024384737014770508, -0.02351093292236328, -0.022637128829956055, -0.021763324737548828, -0.0208895206451416, -0.020015716552734375, -0.01914191246032715, -0.018268108367919922, -0.017394304275512695, -0.01652050018310547, -0.015646696090698242, -0.014772891998291016, -0.013899087905883789, -0.013025283813476562, -0.012151479721069336, -0.01127767562866211, -0.010403871536254883, -0.009530067443847656, -0.00865626335144043, -0.007782459259033203, -0.0069086551666259766, -0.00603485107421875, -0.0051610469818115234, -0.004287242889404297, -0.0034134387969970703, -0.0025396347045898438, -0.0016658306121826172, -0.0007920265197753906, 8.177757263183594e-05, 0.0009555816650390625, 0.001829385757446289, 0.0027031898498535156, 0.003576993942260742, 0.004450798034667969, 0.005324602127075195, 0.006198406219482422, 0.0070722103118896484, 0.007946014404296875, 0.008819818496704102, 0.009693622589111328, 0.010567426681518555, 0.011441230773925781, 0.012315034866333008, 0.013188838958740234, 0.014062643051147461, 0.014936447143554688, 0.015810251235961914, 0.01668405532836914, 0.017557859420776367, 0.018431663513183594, 0.01930546760559082, 0.020179271697998047, 0.021053075790405273, 0.0219268798828125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 31.0, 165.0, 366.0, 324.0, 98.0, 19.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0231781005859375, -0.022636890411376953, -0.022095680236816406, -0.02155447006225586, -0.021013259887695312, -0.020472049713134766, -0.01993083953857422, -0.019389629364013672, -0.018848419189453125, -0.018307209014892578, -0.01776599884033203, -0.017224788665771484, -0.016683578491210938, -0.01614236831665039, -0.015601158142089844, -0.015059947967529297, -0.01451873779296875, -0.013977527618408203, -0.013436317443847656, -0.01289510726928711, -0.012353897094726562, -0.011812686920166016, -0.011271476745605469, -0.010730266571044922, -0.010189056396484375, -0.009647846221923828, -0.009106636047363281, -0.008565425872802734, -0.008024215698242188, -0.007483005523681641, -0.006941795349121094, -0.006400585174560547, -0.005859375, -0.005318164825439453, -0.004776954650878906, -0.004235744476318359, -0.0036945343017578125, -0.0031533241271972656, -0.0026121139526367188, -0.002070903778076172, -0.001529693603515625, -0.0009884834289550781, -0.00044727325439453125, 9.393692016601562e-05, 0.0006351470947265625, 0.0011763572692871094, 0.0017175674438476562, 0.002258777618408203, 0.00279998779296875, 0.003341197967529297, 0.0038824081420898438, 0.004423618316650391, 0.0049648284912109375, 0.005506038665771484, 0.006047248840332031, 0.006588459014892578, 0.007129669189453125, 0.007670879364013672, 0.008212089538574219, 0.008753299713134766, 0.009294509887695312, 0.00983572006225586, 0.010376930236816406, 0.010918140411376953, 0.0114593505859375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 9.0, 5.0, 13.0, 35.0, 38.0, 68.0, 120.0, 216.0, 451.0, 934.0, 2519.0, 7769.0, 33012.0, 244861.0, 3681055.0, 184159.0, 27966.0, 6923.0, 2222.0, 938.0, 466.0, 217.0, 128.0, 65.0, 37.0, 22.0, 16.0, 6.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005420684814453125, -0.005248308181762695, -0.005075931549072266, -0.004903554916381836, -0.004731178283691406, -0.0045588016510009766, -0.004386425018310547, -0.004214048385620117, -0.0040416717529296875, -0.003869295120239258, -0.003696918487548828, -0.0035245418548583984, -0.0033521652221679688, -0.003179788589477539, -0.0030074119567871094, -0.0028350353240966797, -0.00266265869140625, -0.0024902820587158203, -0.0023179054260253906, -0.002145528793334961, -0.0019731521606445312, -0.0018007755279541016, -0.0016283988952636719, -0.0014560222625732422, -0.0012836456298828125, -0.0011112689971923828, -0.0009388923645019531, -0.0007665157318115234, -0.0005941390991210938, -0.00042176246643066406, -0.0002493858337402344, -7.700920104980469e-05, 9.5367431640625e-05, 0.0002677440643310547, 0.0004401206970214844, 0.0006124973297119141, 0.0007848739624023438, 0.0009572505950927734, 0.0011296272277832031, 0.0013020038604736328, 0.0014743804931640625, 0.0016467571258544922, 0.0018191337585449219, 0.0019915103912353516, 0.0021638870239257812, 0.002336263656616211, 0.0025086402893066406, 0.0026810169219970703, 0.0028533935546875, 0.0030257701873779297, 0.0031981468200683594, 0.003370523452758789, 0.0035429000854492188, 0.0037152767181396484, 0.003887653350830078, 0.004060029983520508, 0.0042324066162109375, 0.004404783248901367, 0.004577159881591797, 0.0047495365142822266, 0.004921913146972656, 0.005094289779663086, 0.005266666412353516, 0.005439043045043945, 0.005611419677734375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 4.0, 4.0, 11.0, 15.0, 11.0, 19.0, 19.0, 38.0, 44.0, 86.0, 165.0, 339.0, 908.0, 1360.0, 514.0, 202.0, 108.0, 58.0, 40.0, 36.0, 23.0, 20.0, 17.0, 11.0, 8.0, 4.0, 1.0, 3.0, 6.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031948089599609375, -0.003085494041442871, -0.0029761791229248047, -0.0028668642044067383, -0.002757549285888672, -0.0026482343673706055, -0.002538919448852539, -0.0024296045303344727, -0.0023202896118164062, -0.00221097469329834, -0.0021016597747802734, -0.001992344856262207, -0.0018830299377441406, -0.0017737150192260742, -0.0016644001007080078, -0.0015550851821899414, -0.001445770263671875, -0.0013364553451538086, -0.0012271404266357422, -0.0011178255081176758, -0.0010085105895996094, -0.000899195671081543, -0.0007898807525634766, -0.0006805658340454102, -0.0005712509155273438, -0.00046193599700927734, -0.00035262107849121094, -0.00024330615997314453, -0.00013399124145507812, -2.467632293701172e-05, 8.463859558105469e-05, 0.0001939535140991211, 0.0003032684326171875, 0.0004125833511352539, 0.0005218982696533203, 0.0006312131881713867, 0.0007405281066894531, 0.0008498430252075195, 0.0009591579437255859, 0.0010684728622436523, 0.0011777877807617188, 0.0012871026992797852, 0.0013964176177978516, 0.001505732536315918, 0.0016150474548339844, 0.0017243623733520508, 0.0018336772918701172, 0.0019429922103881836, 0.00205230712890625, 0.0021616220474243164, 0.002270936965942383, 0.0023802518844604492, 0.0024895668029785156, 0.002598881721496582, 0.0027081966400146484, 0.002817511558532715, 0.0029268264770507812, 0.0030361413955688477, 0.003145456314086914, 0.0032547712326049805, 0.003364086151123047, 0.0034734010696411133, 0.0035827159881591797, 0.003692030906677246, 0.0038013458251953125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 21.0, 166.0, 591.0, 203.0, 18.0, 9.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08301292359828949, -0.08118685334920883, -0.07936078310012817, -0.07753471285104752, -0.07570864260196686, -0.0738825798034668, -0.07205650955438614, -0.07023043930530548, -0.06840436905622482, -0.06657829880714417, -0.06475222855806351, -0.06292615830898285, -0.06110009178519249, -0.05927402153611183, -0.05744795501232147, -0.055621884763240814, -0.053795814514160156, -0.0519697442650795, -0.05014367401599884, -0.04831760749220848, -0.04649153724312782, -0.044665466994047165, -0.042839400470256805, -0.04101333022117615, -0.03918725997209549, -0.03736118972301483, -0.035535119473934174, -0.033709052950143814, -0.031882982701063156, -0.030056912451982498, -0.02823084406554699, -0.02640477567911148, -0.02457870915532112, -0.022752638906240463, -0.020926570519804955, -0.019100502133369446, -0.017274431884288788, -0.015448362566530704, -0.013622293248772621, -0.011796223931014538, -0.009970154613256454, -0.008144085295498371, -0.006318015977740288, -0.0044919466599822044, -0.002665877342224121, -0.0008398080244660378, 0.0009862612932920456, 0.002812330611050129, 0.004638399928808212, 0.006464469246566296, 0.008290538564324379, 0.010116607882082462, 0.011942677199840546, 0.013768746517598629, 0.015594815835356712, 0.01742088422179222, 0.01924695447087288, 0.021073024719953537, 0.022899093106389046, 0.024725161492824554, 0.026551231741905212, 0.02837730199098587, 0.03020337037742138, 0.03202943876385689, 0.033855509012937546]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 7.0, 5.0, 9.0, 11.0, 9.0, 17.0, 23.0, 37.0, 34.0, 42.0, 50.0, 56.0, 46.0, 67.0, 67.0, 67.0, 58.0, 57.0, 52.0, 55.0, 49.0, 43.0, 32.0, 27.0, 22.0, 22.0, 15.0, 7.0, 7.0, 8.0, 1.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011877834796905518, -0.011559507809579372, -0.011241180822253227, -0.010922853834927082, -0.010604526847600937, -0.010286199860274792, -0.009967872872948647, -0.009649545885622501, -0.009331218898296356, -0.009012891910970211, -0.008694564923644066, -0.00837623793631792, -0.008057910948991776, -0.00773958396166563, -0.007421256974339485, -0.00710292998701334, -0.006784602999687195, -0.00646627601236105, -0.0061479490250349045, -0.005829622037708759, -0.005511295050382614, -0.005192968063056469, -0.004874641075730324, -0.004556314088404179, -0.0042379871010780334, -0.003919660113751888, -0.003601333126425743, -0.003283006139099598, -0.0029646791517734528, -0.0026463521644473076, -0.0023280251771211624, -0.0020096981897950172, -0.001691371202468872, -0.001373044215142727, -0.0010547172278165817, -0.0007363902404904366, -0.0004180632531642914, -9.973626583814621e-05, 0.00021859072148799896, 0.0005369177088141441, 0.0008552446961402893, 0.0011735716834664345, 0.0014918986707925797, 0.0018102256581187248, 0.00212855264544487, 0.002446879632771015, 0.0027652066200971603, 0.0030835336074233055, 0.0034018605947494507, 0.003720187582075596, 0.004038514569401741, 0.004356841556727886, 0.004675168544054031, 0.0049934955313801765, 0.005311822518706322, 0.005630149506032467, 0.005948476493358612, 0.006266803480684757, 0.006585130468010902, 0.006903457455337048, 0.007221784442663193, 0.007540111429989338, 0.007858438417315483, 0.008176765404641628, 0.008495092391967773]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 4.0, 5.0, 8.0, 11.0, 10.0, 17.0, 27.0, 18.0, 31.0, 41.0, 58.0, 94.0, 143.0, 191.0, 268.0, 405.0, 692.0, 1301.0, 4394.0, 139196.0, 870810.0, 25771.0, 2342.0, 928.0, 584.0, 354.0, 238.0, 172.0, 116.0, 88.0, 74.0, 35.0, 23.0, 32.0, 16.0, 15.0, 13.0, 12.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.01715087890625, -0.016678452491760254, -0.016206026077270508, -0.01573359966278076, -0.015261173248291016, -0.01478874683380127, -0.014316320419311523, -0.013843894004821777, -0.013371467590332031, -0.012899041175842285, -0.012426614761352539, -0.011954188346862793, -0.011481761932373047, -0.0110093355178833, -0.010536909103393555, -0.010064482688903809, -0.009592056274414062, -0.009119629859924316, -0.00864720344543457, -0.008174777030944824, -0.007702350616455078, -0.007229924201965332, -0.006757497787475586, -0.00628507137298584, -0.005812644958496094, -0.005340218544006348, -0.0048677921295166016, -0.0043953657150268555, -0.003922939300537109, -0.0034505128860473633, -0.002978086471557617, -0.002505660057067871, -0.002033233642578125, -0.001560807228088379, -0.0010883808135986328, -0.0006159543991088867, -0.00014352798461914062, 0.00032889842987060547, 0.0008013248443603516, 0.0012737512588500977, 0.0017461776733398438, 0.00221860408782959, 0.002691030502319336, 0.003163456916809082, 0.003635883331298828, 0.004108309745788574, 0.00458073616027832, 0.005053162574768066, 0.0055255889892578125, 0.005998015403747559, 0.006470441818237305, 0.006942868232727051, 0.007415294647216797, 0.007887721061706543, 0.008360147476196289, 0.008832573890686035, 0.009305000305175781, 0.009777426719665527, 0.010249853134155273, 0.01072227954864502, 0.011194705963134766, 0.011667132377624512, 0.012139558792114258, 0.012611985206604004, 0.01308441162109375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 8.0, 71.0, 252.0, 395.0, 223.0, 53.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.023193359375, -0.022646546363830566, -0.022099733352661133, -0.0215529203414917, -0.021006107330322266, -0.020459294319152832, -0.0199124813079834, -0.019365668296813965, -0.01881885528564453, -0.018272042274475098, -0.017725229263305664, -0.01717841625213623, -0.016631603240966797, -0.016084790229797363, -0.01553797721862793, -0.014991164207458496, -0.014444351196289062, -0.013897538185119629, -0.013350725173950195, -0.012803912162780762, -0.012257099151611328, -0.011710286140441895, -0.011163473129272461, -0.010616660118103027, -0.010069847106933594, -0.00952303409576416, -0.008976221084594727, -0.008429408073425293, -0.00788259506225586, -0.007335782051086426, -0.006788969039916992, -0.006242156028747559, -0.005695343017578125, -0.005148530006408691, -0.004601716995239258, -0.004054903984069824, -0.0035080909729003906, -0.002961277961730957, -0.0024144649505615234, -0.0018676519393920898, -0.0013208389282226562, -0.0007740259170532227, -0.00022721290588378906, 0.00031960010528564453, 0.0008664131164550781, 0.0014132261276245117, 0.0019600391387939453, 0.002506852149963379, 0.0030536651611328125, 0.003600478172302246, 0.00414729118347168, 0.004694104194641113, 0.005240917205810547, 0.0057877302169799805, 0.006334543228149414, 0.006881356239318848, 0.007428169250488281, 0.007974982261657715, 0.008521795272827148, 0.009068608283996582, 0.009615421295166016, 0.01016223430633545, 0.010709047317504883, 0.011255860328674316, 0.01180267333984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 3.0, 4.0, 4.0, 3.0, 5.0, 6.0, 12.0, 12.0, 15.0, 13.0, 15.0, 29.0, 28.0, 23.0, 43.0, 53.0, 94.0, 106.0, 151.0, 265.0, 545.0, 1761.0, 8412.0, 66277.0, 528779.0, 391826.0, 41621.0, 5820.0, 1349.0, 502.0, 203.0, 154.0, 107.0, 73.0, 62.0, 43.0, 24.0, 26.0, 27.0, 10.0, 17.0, 10.0, 7.0, 6.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.007556915283203125, -0.007333993911743164, -0.007111072540283203, -0.006888151168823242, -0.006665229797363281, -0.00644230842590332, -0.006219387054443359, -0.0059964656829833984, -0.0057735443115234375, -0.0055506229400634766, -0.005327701568603516, -0.005104780197143555, -0.004881858825683594, -0.004658937454223633, -0.004436016082763672, -0.004213094711303711, -0.00399017333984375, -0.003767251968383789, -0.003544330596923828, -0.003321409225463867, -0.0030984878540039062, -0.0028755664825439453, -0.0026526451110839844, -0.0024297237396240234, -0.0022068023681640625, -0.0019838809967041016, -0.0017609596252441406, -0.0015380382537841797, -0.0013151168823242188, -0.0010921955108642578, -0.0008692741394042969, -0.0006463527679443359, -0.000423431396484375, -0.00020051002502441406, 2.2411346435546875e-05, 0.0002453327178955078, 0.00046825408935546875, 0.0006911754608154297, 0.0009140968322753906, 0.0011370182037353516, 0.0013599395751953125, 0.0015828609466552734, 0.0018057823181152344, 0.0020287036895751953, 0.0022516250610351562, 0.002474546432495117, 0.002697467803955078, 0.002920389175415039, 0.003143310546875, 0.003366231918334961, 0.003589153289794922, 0.003812074661254883, 0.004034996032714844, 0.004257917404174805, 0.004480838775634766, 0.0047037601470947266, 0.0049266815185546875, 0.0051496028900146484, 0.005372524261474609, 0.00559544563293457, 0.005818367004394531, 0.006041288375854492, 0.006264209747314453, 0.006487131118774414, 0.006710052490234375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 0.0, 5.0, 4.0, 4.0, 6.0, 6.0, 10.0, 13.0, 10.0, 12.0, 13.0, 24.0, 28.0, 27.0, 35.0, 38.0, 32.0, 27.0, 43.0, 50.0, 36.0, 43.0, 44.0, 52.0, 32.0, 49.0, 56.0, 36.0, 35.0, 34.0, 26.0, 24.0, 18.0, 27.0, 11.0, 16.0, 8.0, 7.0, 10.0, 14.0, 8.0, 10.0, 6.0, 1.0, 3.0, 6.0, 2.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.004970550537109375, -0.004811286926269531, -0.0046520233154296875, -0.004492759704589844, -0.00433349609375, -0.004174232482910156, -0.0040149688720703125, -0.0038557052612304688, -0.003696441650390625, -0.0035371780395507812, -0.0033779144287109375, -0.0032186508178710938, -0.00305938720703125, -0.0029001235961914062, -0.0027408599853515625, -0.0025815963745117188, -0.002422332763671875, -0.0022630691528320312, -0.0021038055419921875, -0.0019445419311523438, -0.0017852783203125, -0.0016260147094726562, -0.0014667510986328125, -0.0013074874877929688, -0.001148223876953125, -0.0009889602661132812, -0.0008296966552734375, -0.0006704330444335938, -0.00051116943359375, -0.00035190582275390625, -0.0001926422119140625, -3.337860107421875e-05, 0.000125885009765625, 0.00028514862060546875, 0.0004444122314453125, 0.0006036758422851562, 0.000762939453125, 0.0009222030639648438, 0.0010814666748046875, 0.0012407302856445312, 0.001399993896484375, 0.0015592575073242188, 0.0017185211181640625, 0.0018777847290039062, 0.00203704833984375, 0.0021963119506835938, 0.0023555755615234375, 0.0025148391723632812, 0.002674102783203125, 0.0028333663940429688, 0.0029926300048828125, 0.0031518936157226562, 0.0033111572265625, 0.0034704208374023438, 0.0036296844482421875, 0.0037889480590820312, 0.003948211669921875, 0.004107475280761719, 0.0042667388916015625, 0.004426002502441406, 0.00458526611328125, 0.004744529724121094, 0.0049037933349609375, 0.005063056945800781, 0.005222320556640625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 0.0, 2.0, 4.0, 12.0, 8.0, 8.0, 15.0, 14.0, 22.0, 21.0, 40.0, 59.0, 75.0, 146.0, 212.0, 488.0, 965.0, 2112.0, 4623.0, 11144.0, 30216.0, 100203.0, 421518.0, 351444.0, 81782.0, 25816.0, 9766.0, 4083.0, 1847.0, 875.0, 420.0, 219.0, 128.0, 74.0, 55.0, 35.0, 31.0, 21.0, 12.0, 9.0, 9.0, 8.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014781951904296875, -0.0014287978410720825, -0.0013794004917144775, -0.0013300031423568726, -0.0012806057929992676, -0.0012312084436416626, -0.0011818110942840576, -0.0011324137449264526, -0.0010830163955688477, -0.0010336190462112427, -0.0009842216968536377, -0.0009348243474960327, -0.0008854269981384277, -0.0008360296487808228, -0.0007866322994232178, -0.0007372349500656128, -0.0006878376007080078, -0.0006384402513504028, -0.0005890429019927979, -0.0005396455526351929, -0.0004902482032775879, -0.0004408508539199829, -0.00039145350456237793, -0.00034205615520477295, -0.00029265880584716797, -0.000243261456489563, -0.000193864107131958, -0.00014446675777435303, -9.506940841674805e-05, -4.5672059059143066e-05, 3.725290298461914e-06, 5.3122639656066895e-05, 0.00010251998901367188, 0.00015191733837127686, 0.00020131468772888184, 0.0002507120370864868, 0.0003001093864440918, 0.0003495067358016968, 0.00039890408515930176, 0.00044830143451690674, 0.0004976987838745117, 0.0005470961332321167, 0.0005964934825897217, 0.0006458908319473267, 0.0006952881813049316, 0.0007446855306625366, 0.0007940828800201416, 0.0008434802293777466, 0.0008928775787353516, 0.0009422749280929565, 0.0009916722774505615, 0.0010410696268081665, 0.0010904669761657715, 0.0011398643255233765, 0.0011892616748809814, 0.0012386590242385864, 0.0012880563735961914, 0.0013374537229537964, 0.0013868510723114014, 0.0014362484216690063, 0.0014856457710266113, 0.0015350431203842163, 0.0015844404697418213, 0.0016338378190994263, 0.0016832351684570312]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 9.0, 7.0, 15.0, 7.0, 22.0, 31.0, 44.0, 46.0, 78.0, 94.0, 90.0, 123.0, 94.0, 80.0, 65.0, 60.0, 31.0, 25.0, 14.0, 12.0, 6.0, 10.0, 6.0, 6.0, 2.0, 10.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.189678192138672e-05, -7.852166891098022e-05, -7.514655590057373e-05, -7.177144289016724e-05, -6.839632987976074e-05, -6.502121686935425e-05, -6.164610385894775e-05, -5.827099084854126e-05, -5.4895877838134766e-05, -5.152076482772827e-05, -4.814565181732178e-05, -4.477053880691528e-05, -4.139542579650879e-05, -3.8020312786102295e-05, -3.46451997756958e-05, -3.127008676528931e-05, -2.7894973754882812e-05, -2.451986074447632e-05, -2.1144747734069824e-05, -1.776963472366333e-05, -1.4394521713256836e-05, -1.1019408702850342e-05, -7.644295692443848e-06, -4.2691826820373535e-06, -8.940696716308594e-07, 2.4810433387756348e-06, 5.856156349182129e-06, 9.231269359588623e-06, 1.2606382369995117e-05, 1.598149538040161e-05, 1.9356608390808105e-05, 2.27317214012146e-05, 2.6106834411621094e-05, 2.9481947422027588e-05, 3.285706043243408e-05, 3.6232173442840576e-05, 3.960728645324707e-05, 4.2982399463653564e-05, 4.635751247406006e-05, 4.973262548446655e-05, 5.310773849487305e-05, 5.648285150527954e-05, 5.9857964515686035e-05, 6.323307752609253e-05, 6.660819053649902e-05, 6.998330354690552e-05, 7.335841655731201e-05, 7.67335295677185e-05, 8.0108642578125e-05, 8.34837555885315e-05, 8.685886859893799e-05, 9.023398160934448e-05, 9.360909461975098e-05, 9.698420763015747e-05, 0.00010035932064056396, 0.00010373443365097046, 0.00010710954666137695, 0.00011048465967178345, 0.00011385977268218994, 0.00011723488569259644, 0.00012060999870300293, 0.00012398511171340942, 0.00012736022472381592, 0.0001307353377342224, 0.0001341104507446289]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 6.0, 11.0, 5.0, 13.0, 17.0, 25.0, 30.0, 48.0, 74.0, 122.0, 197.0, 385.0, 822.0, 1953.0, 6047.0, 22535.0, 127655.0, 685929.0, 164795.0, 26908.0, 6839.0, 2306.0, 875.0, 404.0, 210.0, 125.0, 75.0, 38.0, 33.0, 32.0, 15.0, 5.0, 12.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026111602783203125, -0.0025228261947631836, -0.0024344921112060547, -0.0023461580276489258, -0.002257823944091797, -0.002169489860534668, -0.002081155776977539, -0.00199282169342041, -0.0019044876098632812, -0.0018161535263061523, -0.0017278194427490234, -0.0016394853591918945, -0.0015511512756347656, -0.0014628171920776367, -0.0013744831085205078, -0.001286149024963379, -0.00119781494140625, -0.001109480857849121, -0.0010211467742919922, -0.0009328126907348633, -0.0008444786071777344, -0.0007561445236206055, -0.0006678104400634766, -0.0005794763565063477, -0.0004911422729492188, -0.00040280818939208984, -0.00031447410583496094, -0.00022614002227783203, -0.00013780593872070312, -4.947185516357422e-05, 3.886222839355469e-05, 0.0001271963119506836, 0.0002155303955078125, 0.0003038644790649414, 0.0003921985626220703, 0.0004805326461791992, 0.0005688667297363281, 0.000657200813293457, 0.0007455348968505859, 0.0008338689804077148, 0.0009222030639648438, 0.0010105371475219727, 0.0010988712310791016, 0.0011872053146362305, 0.0012755393981933594, 0.0013638734817504883, 0.0014522075653076172, 0.001540541648864746, 0.001628875732421875, 0.001717209815979004, 0.0018055438995361328, 0.0018938779830932617, 0.0019822120666503906, 0.0020705461502075195, 0.0021588802337646484, 0.0022472143173217773, 0.0023355484008789062, 0.002423882484436035, 0.002512216567993164, 0.002600550651550293, 0.002688884735107422, 0.0027772188186645508, 0.0028655529022216797, 0.0029538869857788086, 0.0030422210693359375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 4.0, 4.0, 4.0, 7.0, 13.0, 9.0, 12.0, 15.0, 13.0, 16.0, 33.0, 63.0, 96.0, 121.0, 132.0, 141.0, 87.0, 62.0, 41.0, 25.0, 20.0, 21.0, 14.0, 6.0, 6.0, 5.0, 7.0, 7.0, 9.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017137527465820312, -0.0016518086194992065, -0.0015898644924163818, -0.0015279203653335571, -0.0014659762382507324, -0.0014040321111679077, -0.001342087984085083, -0.0012801438570022583, -0.0012181997299194336, -0.0011562556028366089, -0.0010943114757537842, -0.0010323673486709595, -0.0009704232215881348, -0.0009084790945053101, -0.0008465349674224854, -0.0007845908403396606, -0.0007226467132568359, -0.0006607025861740112, -0.0005987584590911865, -0.0005368143320083618, -0.0004748702049255371, -0.0004129260778427124, -0.0003509819507598877, -0.000289037823677063, -0.00022709369659423828, -0.00016514956951141357, -0.00010320544242858887, -4.126131534576416e-05, 2.0682811737060547e-05, 8.262693881988525e-05, 0.00014457106590270996, 0.00020651519298553467, 0.0002684593200683594, 0.0003304034471511841, 0.0003923475742340088, 0.0004542917013168335, 0.0005162358283996582, 0.0005781799554824829, 0.0006401240825653076, 0.0007020682096481323, 0.000764012336730957, 0.0008259564638137817, 0.0008879005908966064, 0.0009498447179794312, 0.0010117888450622559, 0.0010737329721450806, 0.0011356770992279053, 0.00119762122631073, 0.0012595653533935547, 0.0013215094804763794, 0.001383453607559204, 0.0014453977346420288, 0.0015073418617248535, 0.0015692859888076782, 0.001631230115890503, 0.0016931742429733276, 0.0017551183700561523, 0.001817062497138977, 0.0018790066242218018, 0.0019409507513046265, 0.002002894878387451, 0.002064839005470276, 0.0021267831325531006, 0.0021887272596359253, 0.00225067138671875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 66.0, 918.0, 34.0, 3.0], "bins": [-0.4222486913204193, -0.41536644101142883, -0.40848419070243835, -0.4016019403934479, -0.3947196900844574, -0.3878374397754669, -0.38095518946647644, -0.37407296895980835, -0.36719071865081787, -0.3603084683418274, -0.3534262180328369, -0.34654396772384644, -0.33966171741485596, -0.3327794671058655, -0.325897216796875, -0.3190149664878845, -0.31213271617889404, -0.30525046586990356, -0.2983682155609131, -0.2914859652519226, -0.28460371494293213, -0.27772146463394165, -0.27083921432495117, -0.2639569640159607, -0.2570747137069702, -0.25019246339797974, -0.24331021308898926, -0.23642796277999878, -0.2295457124710083, -0.22266346216201782, -0.21578122675418854, -0.20889897644519806, -0.20201674103736877, -0.1951344907283783, -0.18825224041938782, -0.18136999011039734, -0.17448773980140686, -0.16760548949241638, -0.1607232540845871, -0.15384100377559662, -0.14695875346660614, -0.14007650315761566, -0.13319425284862518, -0.1263120025396347, -0.11942975968122482, -0.11254750937223434, -0.10566526651382446, -0.09878301620483398, -0.0919007658958435, -0.08501851558685303, -0.07813626527786255, -0.07125402241945267, -0.06437177211046219, -0.05748952180147171, -0.05060727521777153, -0.04372502863407135, -0.03684277832508087, -0.029960529878735542, -0.023078281432390213, -0.016196032986044884, -0.009313784539699554, -0.002431534230709076, 0.004450712352991104, 0.011332958936691284, 0.018215209245681763]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 3.0, 6.0, 2.0, 10.0, 11.0, 10.0, 14.0, 23.0, 20.0, 26.0, 27.0, 32.0, 34.0, 28.0, 35.0, 39.0, 38.0, 43.0, 36.0, 39.0, 49.0, 37.0, 39.0, 37.0, 35.0, 33.0, 37.0, 36.0, 32.0, 42.0, 18.0, 16.0, 16.0, 21.0, 16.0, 16.0, 9.0, 8.0, 6.0, 7.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01556253433227539, -0.015085629187524319, -0.014608724042773247, -0.014131818898022175, -0.013654913753271103, -0.013178008608520031, -0.012701103463768959, -0.012224198319017887, -0.011747293174266815, -0.011270388029515743, -0.010793482884764671, -0.0103165777400136, -0.009839672595262527, -0.009362767450511456, -0.008885862305760384, -0.008408957161009312, -0.00793205201625824, -0.007455146871507168, -0.006978241726756096, -0.006501336582005024, -0.006024431437253952, -0.00554752629250288, -0.005070621147751808, -0.004593716003000736, -0.004116810858249664, -0.0036399057134985924, -0.0031630005687475204, -0.0026860954239964485, -0.0022091902792453766, -0.0017322851344943047, -0.0012553799897432327, -0.0007784748449921608, -0.00030156970024108887, 0.00017533544450998306, 0.000652240589261055, 0.001129145734012127, 0.0016060508787631989, 0.0020829560235142708, 0.0025598611682653427, 0.0030367663130164146, 0.0035136714577674866, 0.0039905766025185585, 0.00446748174726963, 0.004944386892020702, 0.005421292036771774, 0.005898197181522846, 0.006375102326273918, 0.00685200747102499, 0.007328912615776062, 0.007805817760527134, 0.008282722905278206, 0.008759628050029278, 0.00923653319478035, 0.009713438339531422, 0.010190343484282494, 0.010667248629033566, 0.011144153773784637, 0.01162105891853571, 0.012097964063286781, 0.012574869208037853, 0.013051774352788925, 0.013528679497539997, 0.014005584642291069, 0.014482489787042141, 0.014959394931793213]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 6.0, 10.0, 12.0, 15.0, 36.0, 40.0, 53.0, 81.0, 110.0, 352.0, 2674.0, 57348.0, 4123212.0, 7958.0, 1343.0, 594.0, 282.0, 73.0, 24.0, 12.0, 10.0, 8.0, 3.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0295257568359375, -0.028773784637451172, -0.028021812438964844, -0.027269840240478516, -0.026517868041992188, -0.02576589584350586, -0.02501392364501953, -0.024261951446533203, -0.023509979248046875, -0.022758007049560547, -0.02200603485107422, -0.02125406265258789, -0.020502090454101562, -0.019750118255615234, -0.018998146057128906, -0.018246173858642578, -0.01749420166015625, -0.016742229461669922, -0.015990257263183594, -0.015238285064697266, -0.014486312866210938, -0.01373434066772461, -0.012982368469238281, -0.012230396270751953, -0.011478424072265625, -0.010726451873779297, -0.009974479675292969, -0.00922250747680664, -0.008470535278320312, -0.007718563079833984, -0.006966590881347656, -0.006214618682861328, -0.005462646484375, -0.004710674285888672, -0.003958702087402344, -0.0032067298889160156, -0.0024547576904296875, -0.0017027854919433594, -0.0009508132934570312, -0.00019884109497070312, 0.000553131103515625, 0.0013051033020019531, 0.0020570755004882812, 0.0028090476989746094, 0.0035610198974609375, 0.004312992095947266, 0.005064964294433594, 0.005816936492919922, 0.00656890869140625, 0.007320880889892578, 0.008072853088378906, 0.008824825286865234, 0.009576797485351562, 0.01032876968383789, 0.011080741882324219, 0.011832714080810547, 0.012584686279296875, 0.013336658477783203, 0.014088630676269531, 0.01484060287475586, 0.015592575073242188, 0.016344547271728516, 0.017096519470214844, 0.017848491668701172, 0.0186004638671875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 52.0, 220.0, 382.0, 271.0, 72.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0228424072265625, -0.022306084632873535, -0.02176976203918457, -0.021233439445495605, -0.02069711685180664, -0.020160794258117676, -0.01962447166442871, -0.019088149070739746, -0.01855182647705078, -0.018015503883361816, -0.01747918128967285, -0.016942858695983887, -0.016406536102294922, -0.015870213508605957, -0.015333890914916992, -0.014797568321228027, -0.014261245727539062, -0.013724923133850098, -0.013188600540161133, -0.012652277946472168, -0.012115955352783203, -0.011579632759094238, -0.011043310165405273, -0.010506987571716309, -0.009970664978027344, -0.009434342384338379, -0.008898019790649414, -0.00836169719696045, -0.007825374603271484, -0.0072890520095825195, -0.006752729415893555, -0.00621640682220459, -0.005680084228515625, -0.00514376163482666, -0.004607439041137695, -0.0040711164474487305, -0.0035347938537597656, -0.0029984712600708008, -0.002462148666381836, -0.001925826072692871, -0.0013895034790039062, -0.0008531808853149414, -0.00031685829162597656, 0.00021946430206298828, 0.0007557868957519531, 0.001292109489440918, 0.0018284320831298828, 0.0023647546768188477, 0.0029010772705078125, 0.0034373998641967773, 0.003973722457885742, 0.004510045051574707, 0.005046367645263672, 0.005582690238952637, 0.0061190128326416016, 0.006655335426330566, 0.007191658020019531, 0.007727980613708496, 0.008264303207397461, 0.008800625801086426, 0.00933694839477539, 0.009873270988464355, 0.01040959358215332, 0.010945916175842285, 0.01148223876953125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 4.0, 12.0, 13.0, 17.0, 42.0, 89.0, 160.0, 325.0, 658.0, 1466.0, 3841.0, 11532.0, 44343.0, 386063.0, 3572340.0, 135160.0, 25577.0, 7555.0, 2767.0, 1157.0, 542.0, 297.0, 146.0, 70.0, 52.0, 20.0, 13.0, 9.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005008697509765625, -0.004862725734710693, -0.004716753959655762, -0.00457078218460083, -0.0044248104095458984, -0.004278838634490967, -0.004132866859436035, -0.0039868950843811035, -0.003840923309326172, -0.0036949515342712402, -0.0035489797592163086, -0.003403007984161377, -0.0032570362091064453, -0.0031110644340515137, -0.002965092658996582, -0.0028191208839416504, -0.0026731491088867188, -0.002527177333831787, -0.0023812055587768555, -0.002235233783721924, -0.002089262008666992, -0.0019432902336120605, -0.001797318458557129, -0.0016513466835021973, -0.0015053749084472656, -0.001359403133392334, -0.0012134313583374023, -0.0010674595832824707, -0.0009214878082275391, -0.0007755160331726074, -0.0006295442581176758, -0.00048357248306274414, -0.0003376007080078125, -0.00019162893295288086, -4.565715789794922e-05, 0.00010031461715698242, 0.00024628639221191406, 0.0003922581672668457, 0.0005382299423217773, 0.000684201717376709, 0.0008301734924316406, 0.0009761452674865723, 0.001122117042541504, 0.0012680888175964355, 0.0014140605926513672, 0.0015600323677062988, 0.0017060041427612305, 0.0018519759178161621, 0.0019979476928710938, 0.0021439194679260254, 0.002289891242980957, 0.0024358630180358887, 0.0025818347930908203, 0.002727806568145752, 0.0028737783432006836, 0.0030197501182556152, 0.003165721893310547, 0.0033116936683654785, 0.00345766544342041, 0.003603637218475342, 0.0037496089935302734, 0.003895580768585205, 0.004041552543640137, 0.004187524318695068, 0.00433349609375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 4.0, 3.0, 9.0, 12.0, 15.0, 18.0, 26.0, 30.0, 44.0, 76.0, 153.0, 313.0, 651.0, 1407.0, 653.0, 279.0, 133.0, 65.0, 45.0, 28.0, 22.0, 17.0, 14.0, 11.0, 10.0, 9.0, 7.0, 1.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021152496337890625, -0.0020288825035095215, -0.0019425153732299805, -0.0018561482429504395, -0.0017697811126708984, -0.0016834139823913574, -0.0015970468521118164, -0.0015106797218322754, -0.0014243125915527344, -0.0013379454612731934, -0.0012515783309936523, -0.0011652112007141113, -0.0010788440704345703, -0.0009924769401550293, -0.0009061098098754883, -0.0008197426795959473, -0.0007333755493164062, -0.0006470084190368652, -0.0005606412887573242, -0.0004742741584777832, -0.0003879070281982422, -0.00030153989791870117, -0.00021517276763916016, -0.00012880563735961914, -4.2438507080078125e-05, 4.392862319946289e-05, 0.0001302957534790039, 0.00021666288375854492, 0.00030303001403808594, 0.00038939714431762695, 0.00047576427459716797, 0.000562131404876709, 0.00064849853515625, 0.000734865665435791, 0.000821232795715332, 0.000907599925994873, 0.000993967056274414, 0.001080334186553955, 0.001166701316833496, 0.0012530684471130371, 0.0013394355773925781, 0.0014258027076721191, 0.0015121698379516602, 0.0015985369682312012, 0.0016849040985107422, 0.0017712712287902832, 0.0018576383590698242, 0.0019440054893493652, 0.0020303726196289062, 0.0021167397499084473, 0.0022031068801879883, 0.0022894740104675293, 0.0023758411407470703, 0.0024622082710266113, 0.0025485754013061523, 0.0026349425315856934, 0.0027213096618652344, 0.0028076767921447754, 0.0028940439224243164, 0.0029804110527038574, 0.0030667781829833984, 0.0031531453132629395, 0.0032395124435424805, 0.0033258795738220215, 0.0034122467041015625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 6.0, 5.0, 30.0, 94.0, 252.0, 367.0, 158.0, 57.0, 27.0, 9.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00914425402879715, -0.008394983597099781, -0.007645712699741125, -0.006896441802382469, -0.0061471713706851006, -0.005397900938987732, -0.004648630041629076, -0.00389935914427042, -0.0031500887125730515, -0.002400818048045039, -0.001651547383517027, -0.0009022767189890146, -0.00015300605446100235, 0.0005962646100670099, 0.0013455352745950222, 0.002094806171953678, 0.0028440766036510468, 0.003593347268179059, 0.004342617932707071, 0.005091888830065727, 0.005841159261763096, 0.0065904296934604645, 0.00733970059081912, 0.008088971488177776, 0.008838241919875145, 0.009587512351572514, 0.010336782783269882, 0.011086054146289825, 0.011835324577987194, 0.012584595009684563, 0.013333866372704506, 0.014083136804401875, 0.014832407236099243, 0.015581677667796612, 0.01633094809949398, 0.017080219462513924, 0.017829488962888718, 0.01857876032590866, 0.019328031688928604, 0.020077303051948547, 0.02082657255232334, 0.021575843915343285, 0.02232511341571808, 0.023074384778738022, 0.023823656141757965, 0.02457292564213276, 0.025322197005152702, 0.026071466505527496, 0.02682073786854744, 0.027570009231567383, 0.028319278731942177, 0.02906855009496212, 0.029817819595336914, 0.030567090958356857, 0.0313163623213768, 0.032065633684396744, 0.03281490504741669, 0.03356417641043663, 0.034313447773456573, 0.03506271541118622, 0.03581198677420616, 0.036561258137226105, 0.03731052950024605, 0.03805980086326599, 0.038809068500995636]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 9.0, 5.0, 14.0, 14.0, 21.0, 24.0, 26.0, 26.0, 31.0, 42.0, 47.0, 37.0, 62.0, 57.0, 41.0, 54.0, 47.0, 64.0, 56.0, 39.0, 39.0, 40.0, 45.0, 35.0, 28.0, 19.0, 19.0, 14.0, 18.0, 5.0, 6.0, 10.0, 1.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007740318775177002, -0.007511595264077187, -0.007282871752977371, -0.007054148241877556, -0.0068254247307777405, -0.006596701219677925, -0.00636797770857811, -0.006139254197478294, -0.005910530686378479, -0.005681807175278664, -0.005453083664178848, -0.005224360153079033, -0.0049956366419792175, -0.004766913130879402, -0.004538189619779587, -0.004309466108679771, -0.004080742597579956, -0.0038520190864801407, -0.0036232955753803253, -0.00339457206428051, -0.0031658485531806946, -0.002937125042080879, -0.002708401530981064, -0.0024796780198812485, -0.002250954508781433, -0.0020222309976816177, -0.0017935074865818024, -0.001564783975481987, -0.0013360604643821716, -0.0011073369532823563, -0.0008786134421825409, -0.0006498899310827255, -0.00042116641998291016, -0.0001924429088830948, 3.628060221672058e-05, 0.00026500411331653595, 0.0004937276244163513, 0.0007224511355161667, 0.0009511746466159821, 0.0011798981577157974, 0.0014086216688156128, 0.0016373451799154282, 0.0018660686910152435, 0.002094792202115059, 0.0023235157132148743, 0.0025522392243146896, 0.002780962735414505, 0.0030096862465143204, 0.0032384097576141357, 0.003467133268713951, 0.0036958567798137665, 0.003924580290913582, 0.004153303802013397, 0.004382027313113213, 0.004610750824213028, 0.004839474335312843, 0.005068197846412659, 0.005296921357512474, 0.005525644868612289, 0.005754368379712105, 0.00598309189081192, 0.0062118154019117355, 0.006440538913011551, 0.006669262424111366, 0.006897985935211182]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 9.0, 7.0, 10.0, 23.0, 22.0, 42.0, 55.0, 72.0, 119.0, 184.0, 275.0, 511.0, 868.0, 2311.0, 23069.0, 926031.0, 88637.0, 3626.0, 1109.0, 546.0, 372.0, 190.0, 153.0, 87.0, 53.0, 35.0, 41.0, 31.0, 18.0, 17.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0171661376953125, -0.01660609245300293, -0.01604604721069336, -0.015486001968383789, -0.014925956726074219, -0.014365911483764648, -0.013805866241455078, -0.013245820999145508, -0.012685775756835938, -0.012125730514526367, -0.011565685272216797, -0.011005640029907227, -0.010445594787597656, -0.009885549545288086, -0.009325504302978516, -0.008765459060668945, -0.008205413818359375, -0.007645368576049805, -0.007085323333740234, -0.006525278091430664, -0.005965232849121094, -0.0054051876068115234, -0.004845142364501953, -0.004285097122192383, -0.0037250518798828125, -0.003165006637573242, -0.002604961395263672, -0.0020449161529541016, -0.0014848709106445312, -0.0009248256683349609, -0.0003647804260253906, 0.0001952648162841797, 0.00075531005859375, 0.0013153553009033203, 0.0018754005432128906, 0.002435445785522461, 0.0029954910278320312, 0.0035555362701416016, 0.004115581512451172, 0.004675626754760742, 0.0052356719970703125, 0.005795717239379883, 0.006355762481689453, 0.0069158077239990234, 0.007475852966308594, 0.008035898208618164, 0.008595943450927734, 0.009155988693237305, 0.009716033935546875, 0.010276079177856445, 0.010836124420166016, 0.011396169662475586, 0.011956214904785156, 0.012516260147094727, 0.013076305389404297, 0.013636350631713867, 0.014196395874023438, 0.014756441116333008, 0.015316486358642578, 0.01587653160095215, 0.01643657684326172, 0.01699662208557129, 0.01755666732788086, 0.01811671257019043, 0.0186767578125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 13.0, 104.0, 284.0, 391.0, 172.0, 38.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0221405029296875, -0.021616220474243164, -0.021091938018798828, -0.020567655563354492, -0.020043373107910156, -0.01951909065246582, -0.018994808197021484, -0.01847052574157715, -0.017946243286132812, -0.017421960830688477, -0.01689767837524414, -0.016373395919799805, -0.01584911346435547, -0.015324831008911133, -0.014800548553466797, -0.014276266098022461, -0.013751983642578125, -0.013227701187133789, -0.012703418731689453, -0.012179136276245117, -0.011654853820800781, -0.011130571365356445, -0.01060628890991211, -0.010082006454467773, -0.009557723999023438, -0.009033441543579102, -0.008509159088134766, -0.00798487663269043, -0.007460594177246094, -0.006936311721801758, -0.006412029266357422, -0.005887746810913086, -0.00536346435546875, -0.004839181900024414, -0.004314899444580078, -0.003790616989135742, -0.0032663345336914062, -0.0027420520782470703, -0.0022177696228027344, -0.0016934871673583984, -0.0011692047119140625, -0.0006449222564697266, -0.00012063980102539062, 0.0004036426544189453, 0.0009279251098632812, 0.0014522075653076172, 0.001976490020751953, 0.002500772476196289, 0.003025054931640625, 0.003549337387084961, 0.004073619842529297, 0.004597902297973633, 0.005122184753417969, 0.005646467208862305, 0.006170749664306641, 0.0066950321197509766, 0.0072193145751953125, 0.0077435970306396484, 0.008267879486083984, 0.00879216194152832, 0.009316444396972656, 0.009840726852416992, 0.010365009307861328, 0.010889291763305664, 0.01141357421875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 6.0, 3.0, 1.0, 3.0, 3.0, 8.0, 11.0, 10.0, 8.0, 18.0, 25.0, 23.0, 31.0, 33.0, 68.0, 85.0, 113.0, 187.0, 363.0, 761.0, 2150.0, 9062.0, 49895.0, 322945.0, 530083.0, 109008.0, 17443.0, 3874.0, 1152.0, 465.0, 229.0, 157.0, 97.0, 50.0, 41.0, 24.0, 28.0, 19.0, 12.0, 15.0, 14.0, 11.0, 12.0, 8.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005218505859375, -0.005026698112487793, -0.004834890365600586, -0.004643082618713379, -0.004451274871826172, -0.004259467124938965, -0.004067659378051758, -0.0038758516311645508, -0.0036840438842773438, -0.0034922361373901367, -0.0033004283905029297, -0.0031086206436157227, -0.0029168128967285156, -0.0027250051498413086, -0.0025331974029541016, -0.0023413896560668945, -0.0021495819091796875, -0.0019577741622924805, -0.0017659664154052734, -0.0015741586685180664, -0.0013823509216308594, -0.0011905431747436523, -0.0009987354278564453, -0.0008069276809692383, -0.0006151199340820312, -0.0004233121871948242, -0.0002315044403076172, -3.9696693420410156e-05, 0.00015211105346679688, 0.0003439188003540039, 0.0005357265472412109, 0.000727534294128418, 0.000919342041015625, 0.001111149787902832, 0.001302957534790039, 0.001494765281677246, 0.0016865730285644531, 0.0018783807754516602, 0.002070188522338867, 0.0022619962692260742, 0.0024538040161132812, 0.0026456117630004883, 0.0028374195098876953, 0.0030292272567749023, 0.0032210350036621094, 0.0034128427505493164, 0.0036046504974365234, 0.0037964582443237305, 0.0039882659912109375, 0.0041800737380981445, 0.0043718814849853516, 0.004563689231872559, 0.004755496978759766, 0.004947304725646973, 0.00513911247253418, 0.005330920219421387, 0.005522727966308594, 0.005714535713195801, 0.005906343460083008, 0.006098151206970215, 0.006289958953857422, 0.006481766700744629, 0.006673574447631836, 0.006865382194519043, 0.00705718994140625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 4.0, 11.0, 6.0, 9.0, 20.0, 11.0, 12.0, 12.0, 19.0, 21.0, 16.0, 20.0, 38.0, 31.0, 44.0, 28.0, 40.0, 48.0, 45.0, 56.0, 40.0, 51.0, 43.0, 43.0, 40.0, 35.0, 27.0, 36.0, 34.0, 30.0, 14.0, 24.0, 22.0, 16.0, 13.0, 8.0, 9.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.005397796630859375, -0.005241692066192627, -0.005085587501525879, -0.004929482936859131, -0.004773378372192383, -0.004617273807525635, -0.004461169242858887, -0.004305064678192139, -0.004148960113525391, -0.003992855548858643, -0.0038367509841918945, -0.0036806464195251465, -0.0035245418548583984, -0.0033684372901916504, -0.0032123327255249023, -0.0030562281608581543, -0.0029001235961914062, -0.002744019031524658, -0.00258791446685791, -0.002431809902191162, -0.002275705337524414, -0.002119600772857666, -0.001963496208190918, -0.00180739164352417, -0.0016512870788574219, -0.0014951825141906738, -0.0013390779495239258, -0.0011829733848571777, -0.0010268688201904297, -0.0008707642555236816, -0.0007146596908569336, -0.0005585551261901855, -0.0004024505615234375, -0.00024634599685668945, -9.02414321899414e-05, 6.586313247680664e-05, 0.0002219676971435547, 0.00037807226181030273, 0.0005341768264770508, 0.0006902813911437988, 0.0008463859558105469, 0.001002490520477295, 0.001158595085144043, 0.001314699649810791, 0.001470804214477539, 0.0016269087791442871, 0.0017830133438110352, 0.0019391179084777832, 0.0020952224731445312, 0.0022513270378112793, 0.0024074316024780273, 0.0025635361671447754, 0.0027196407318115234, 0.0028757452964782715, 0.0030318498611450195, 0.0031879544258117676, 0.0033440589904785156, 0.0035001635551452637, 0.0036562681198120117, 0.0038123726844787598, 0.003968477249145508, 0.004124581813812256, 0.004280686378479004, 0.004436790943145752, 0.0045928955078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 4.0, 10.0, 10.0, 16.0, 21.0, 27.0, 27.0, 49.0, 73.0, 105.0, 165.0, 201.0, 276.0, 429.0, 623.0, 848.0, 1265.0, 1901.0, 2790.0, 4324.0, 6696.0, 10670.0, 17801.0, 32638.0, 64685.0, 139243.0, 263014.0, 244578.0, 123454.0, 57992.0, 29792.0, 16479.0, 9903.0, 6105.0, 3829.0, 2639.0, 1833.0, 1272.0, 822.0, 626.0, 375.0, 281.0, 213.0, 132.0, 84.0, 73.0, 51.0, 40.0, 21.0, 19.0, 9.0, 10.0, 5.0, 5.0, 2.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0007758140563964844, -0.0007498860359191895, -0.0007239580154418945, -0.0006980299949645996, -0.0006721019744873047, -0.0006461739540100098, -0.0006202459335327148, -0.0005943179130554199, -0.000568389892578125, -0.0005424618721008301, -0.0005165338516235352, -0.0004906058311462402, -0.0004646778106689453, -0.0004387497901916504, -0.00041282176971435547, -0.00038689374923706055, -0.0003609657287597656, -0.0003350377082824707, -0.0003091096878051758, -0.00028318166732788086, -0.00025725364685058594, -0.00023132562637329102, -0.0002053976058959961, -0.00017946958541870117, -0.00015354156494140625, -0.00012761354446411133, -0.0001016855239868164, -7.575750350952148e-05, -4.982948303222656e-05, -2.390146255493164e-05, 2.0265579223632812e-06, 2.7954578399658203e-05, 5.3882598876953125e-05, 7.981061935424805e-05, 0.00010573863983154297, 0.0001316666603088379, 0.0001575946807861328, 0.00018352270126342773, 0.00020945072174072266, 0.00023537874221801758, 0.0002613067626953125, 0.0002872347831726074, 0.00031316280364990234, 0.00033909082412719727, 0.0003650188446044922, 0.0003909468650817871, 0.00041687488555908203, 0.00044280290603637695, 0.0004687309265136719, 0.0004946589469909668, 0.0005205869674682617, 0.0005465149879455566, 0.0005724430084228516, 0.0005983710289001465, 0.0006242990493774414, 0.0006502270698547363, 0.0006761550903320312, 0.0007020831108093262, 0.0007280111312866211, 0.000753939151763916, 0.0007798671722412109, 0.0008057951927185059, 0.0008317232131958008, 0.0008576512336730957, 0.0008835792541503906]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 9.0, 12.0, 12.0, 21.0, 21.0, 20.0, 52.0, 65.0, 69.0, 100.0, 114.0, 98.0, 89.0, 78.0, 46.0, 51.0, 45.0, 35.0, 15.0, 22.0, 8.0, 7.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.191036224365234e-05, -8.885841816663742e-05, -8.58064740896225e-05, -8.275453001260757e-05, -7.970258593559265e-05, -7.665064185857773e-05, -7.35986977815628e-05, -7.054675370454788e-05, -6.749480962753296e-05, -6.444286555051804e-05, -6.139092147350311e-05, -5.833897739648819e-05, -5.5287033319473267e-05, -5.2235089242458344e-05, -4.918314516544342e-05, -4.61312010884285e-05, -4.3079257011413574e-05, -4.002731293439865e-05, -3.697536885738373e-05, -3.3923424780368805e-05, -3.087148070335388e-05, -2.781953662633896e-05, -2.4767592549324036e-05, -2.1715648472309113e-05, -1.866370439529419e-05, -1.5611760318279266e-05, -1.2559816241264343e-05, -9.50787216424942e-06, -6.455928087234497e-06, -3.403984010219574e-06, -3.520399332046509e-07, 2.6999041438102722e-06, 5.751848220825195e-06, 8.803792297840118e-06, 1.1855736374855042e-05, 1.4907680451869965e-05, 1.7959624528884888e-05, 2.101156860589981e-05, 2.4063512682914734e-05, 2.7115456759929657e-05, 3.016740083694458e-05, 3.32193449139595e-05, 3.6271288990974426e-05, 3.932323306798935e-05, 4.237517714500427e-05, 4.5427121222019196e-05, 4.847906529903412e-05, 5.153100937604904e-05, 5.4582953453063965e-05, 5.763489753007889e-05, 6.068684160709381e-05, 6.373878568410873e-05, 6.679072976112366e-05, 6.984267383813858e-05, 7.28946179151535e-05, 7.594656199216843e-05, 7.899850606918335e-05, 8.205045014619827e-05, 8.51023942232132e-05, 8.815433830022812e-05, 9.120628237724304e-05, 9.425822645425797e-05, 9.731017053127289e-05, 0.00010036211460828781, 0.00010341405868530273]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 3.0, 16.0, 17.0, 32.0, 57.0, 94.0, 166.0, 399.0, 870.0, 2321.0, 7664.0, 35871.0, 379659.0, 559314.0, 47928.0, 9431.0, 2769.0, 1004.0, 456.0, 207.0, 121.0, 64.0, 33.0, 24.0, 13.0, 5.0, 3.0, 3.0, 5.0, 1.0, 1.0, 1.0], "bins": [-0.004680633544921875, -0.0045768022537231445, -0.004472970962524414, -0.004369139671325684, -0.004265308380126953, -0.004161477088928223, -0.004057645797729492, -0.003953814506530762, -0.0038499832153320312, -0.0037461519241333008, -0.0036423206329345703, -0.00353848934173584, -0.0034346580505371094, -0.003330826759338379, -0.0032269954681396484, -0.003123164176940918, -0.0030193328857421875, -0.002915501594543457, -0.0028116703033447266, -0.002707839012145996, -0.0026040077209472656, -0.002500176429748535, -0.0023963451385498047, -0.0022925138473510742, -0.0021886825561523438, -0.0020848512649536133, -0.001981019973754883, -0.0018771886825561523, -0.0017733573913574219, -0.0016695261001586914, -0.001565694808959961, -0.0014618635177612305, -0.0013580322265625, -0.0012542009353637695, -0.001150369644165039, -0.0010465383529663086, -0.0009427070617675781, -0.0008388757705688477, -0.0007350444793701172, -0.0006312131881713867, -0.0005273818969726562, -0.0004235506057739258, -0.0003197193145751953, -0.00021588802337646484, -0.00011205673217773438, -8.225440979003906e-06, 9.560585021972656e-05, 0.00019943714141845703, 0.0003032684326171875, 0.00040709972381591797, 0.0005109310150146484, 0.0006147623062133789, 0.0007185935974121094, 0.0008224248886108398, 0.0009262561798095703, 0.0010300874710083008, 0.0011339187622070312, 0.0012377500534057617, 0.0013415813446044922, 0.0014454126358032227, 0.0015492439270019531, 0.0016530752182006836, 0.001756906509399414, 0.0018607378005981445, 0.001964569091796875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 5.0, 8.0, 13.0, 16.0, 21.0, 37.0, 46.0, 59.0, 90.0, 114.0, 149.0, 113.0, 104.0, 74.0, 49.0, 29.0, 20.0, 11.0, 11.0, 7.0, 7.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00127410888671875, -0.001201331615447998, -0.001128554344177246, -0.0010557770729064941, -0.0009829998016357422, -0.0009102225303649902, -0.0008374452590942383, -0.0007646679878234863, -0.0006918907165527344, -0.0006191134452819824, -0.0005463361740112305, -0.0004735589027404785, -0.00040078163146972656, -0.0003280043601989746, -0.00025522708892822266, -0.0001824498176574707, -0.00010967254638671875, -3.68952751159668e-05, 3.5881996154785156e-05, 0.00010865926742553711, 0.00018143653869628906, 0.000254213809967041, 0.00032699108123779297, 0.0003997683525085449, 0.0004725456237792969, 0.0005453228950500488, 0.0006181001663208008, 0.0006908774375915527, 0.0007636547088623047, 0.0008364319801330566, 0.0009092092514038086, 0.0009819865226745605, 0.0010547637939453125, 0.0011275410652160645, 0.0012003183364868164, 0.0012730956077575684, 0.0013458728790283203, 0.0014186501502990723, 0.0014914274215698242, 0.0015642046928405762, 0.0016369819641113281, 0.00170975923538208, 0.001782536506652832, 0.001855313777923584, 0.001928091049194336, 0.002000868320465088, 0.00207364559173584, 0.002146422863006592, 0.0022192001342773438, 0.0022919774055480957, 0.0023647546768188477, 0.0024375319480895996, 0.0025103092193603516, 0.0025830864906311035, 0.0026558637619018555, 0.0027286410331726074, 0.0028014183044433594, 0.0028741955757141113, 0.0029469728469848633, 0.0030197501182556152, 0.003092527389526367, 0.003165304660797119, 0.003238081932067871, 0.003310859203338623, 0.003383636474609375]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 823.0, 193.0, 1.0], "bins": [-0.6950159072875977, -0.6837791800498962, -0.6725425124168396, -0.6613057851791382, -0.6500691175460815, -0.6388323903083801, -0.6275957226753235, -0.6163589954376221, -0.6051223278045654, -0.593885600566864, -0.5826489329338074, -0.571412205696106, -0.5601755380630493, -0.5489388108253479, -0.5377021431922913, -0.5264654159545898, -0.5152286887168884, -0.503991961479187, -0.49275529384613037, -0.48151859641075134, -0.4702818989753723, -0.4590451717376709, -0.44780850410461426, -0.43657177686691284, -0.4253351092338562, -0.4140984117984772, -0.40286171436309814, -0.3916250169277191, -0.3803883194923401, -0.36915159225463867, -0.35791492462158203, -0.3466781973838806, -0.3354414701461792, -0.32420477271080017, -0.31296807527542114, -0.3017313778400421, -0.2904946804046631, -0.27925795316696167, -0.26802128553390503, -0.2567845582962036, -0.24554787576198578, -0.23431117832660675, -0.22307448089122772, -0.2118377685546875, -0.20060107111930847, -0.18936437368392944, -0.17812767624855042, -0.1668909788131714, -0.15565426647663116, -0.14441756904125214, -0.1331808716058731, -0.12194416671991348, -0.11070746183395386, -0.09947076439857483, -0.0882340669631958, -0.07699736207723618, -0.06576067209243774, -0.05452397093176842, -0.04328726977109909, -0.03205057233572006, -0.020813871175050735, -0.009577170014381409, 0.0016595274209976196, 0.012896232306957245, 0.024132931604981422]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 5.0, 10.0, 12.0, 10.0, 16.0, 18.0, 26.0, 38.0, 40.0, 48.0, 53.0, 40.0, 60.0, 53.0, 48.0, 43.0, 54.0, 66.0, 42.0, 49.0, 41.0, 31.0, 29.0, 32.0, 21.0, 26.0, 20.0, 17.0, 17.0, 13.0, 9.0, 9.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013702332973480225, -0.013105371966958046, -0.012508410960435867, -0.011911449953913689, -0.01131448894739151, -0.010717527940869331, -0.010120566934347153, -0.009523605927824974, -0.008926644921302795, -0.008329683914780617, -0.007732722908258438, -0.0071357619017362595, -0.006538800895214081, -0.005941839888691902, -0.0053448788821697235, -0.004747917875647545, -0.004150956869125366, -0.0035539958626031876, -0.002957034856081009, -0.0023600738495588303, -0.0017631128430366516, -0.001166151836514473, -0.0005691908299922943, 2.777017652988434e-05, 0.000624731183052063, 0.0012216921895742416, 0.0018186531960964203, 0.002415614202618599, 0.0030125752091407776, 0.0036095362156629562, 0.004206497222185135, 0.0048034582287073135, 0.005400419235229492, 0.005997380241751671, 0.0065943412482738495, 0.007191302254796028, 0.007788263261318207, 0.008385224267840385, 0.008982185274362564, 0.009579146280884743, 0.010176107287406921, 0.0107730682939291, 0.011370029300451279, 0.011966990306973457, 0.012563951313495636, 0.013160912320017815, 0.013757873326539993, 0.014354834333062172, 0.01495179533958435, 0.01554875634610653, 0.016145717352628708, 0.016742678359150887, 0.017339639365673065, 0.017936600372195244, 0.018533561378717422, 0.0191305223852396, 0.01972748339176178, 0.02032444439828396, 0.020921405404806137, 0.021518366411328316, 0.022115327417850494, 0.022712288424372673, 0.02330924943089485, 0.02390621043741703, 0.02450317144393921]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 14.0, 12.0, 13.0, 17.0, 30.0, 46.0, 66.0, 103.0, 228.0, 1827.0, 14879.0, 4150689.0, 22584.0, 2360.0, 774.0, 434.0, 110.0, 33.0, 19.0, 10.0, 11.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0262298583984375, -0.025492191314697266, -0.02475452423095703, -0.024016857147216797, -0.023279190063476562, -0.022541522979736328, -0.021803855895996094, -0.02106618881225586, -0.020328521728515625, -0.01959085464477539, -0.018853187561035156, -0.018115520477294922, -0.017377853393554688, -0.016640186309814453, -0.01590251922607422, -0.015164852142333984, -0.01442718505859375, -0.013689517974853516, -0.012951850891113281, -0.012214183807373047, -0.011476516723632812, -0.010738849639892578, -0.010001182556152344, -0.00926351547241211, -0.008525848388671875, -0.007788181304931641, -0.007050514221191406, -0.006312847137451172, -0.0055751800537109375, -0.004837512969970703, -0.004099845886230469, -0.0033621788024902344, -0.00262451171875, -0.0018868446350097656, -0.0011491775512695312, -0.0004115104675292969, 0.0003261566162109375, 0.0010638236999511719, 0.0018014907836914062, 0.0025391578674316406, 0.003276824951171875, 0.004014492034912109, 0.004752159118652344, 0.005489826202392578, 0.0062274932861328125, 0.006965160369873047, 0.007702827453613281, 0.008440494537353516, 0.00917816162109375, 0.009915828704833984, 0.010653495788574219, 0.011391162872314453, 0.012128829956054688, 0.012866497039794922, 0.013604164123535156, 0.01434183120727539, 0.015079498291015625, 0.01581716537475586, 0.016554832458496094, 0.017292499542236328, 0.018030166625976562, 0.018767833709716797, 0.01950550079345703, 0.020243167877197266, 0.0209808349609375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 19.0, 112.0, 308.0, 374.0, 162.0, 27.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.022003173828125, -0.021480560302734375, -0.02095794677734375, -0.020435333251953125, -0.0199127197265625, -0.019390106201171875, -0.01886749267578125, -0.018344879150390625, -0.017822265625, -0.017299652099609375, -0.01677703857421875, -0.016254425048828125, -0.0157318115234375, -0.015209197998046875, -0.01468658447265625, -0.014163970947265625, -0.013641357421875, -0.013118743896484375, -0.01259613037109375, -0.012073516845703125, -0.0115509033203125, -0.011028289794921875, -0.01050567626953125, -0.009983062744140625, -0.00946044921875, -0.008937835693359375, -0.00841522216796875, -0.007892608642578125, -0.0073699951171875, -0.006847381591796875, -0.00632476806640625, -0.005802154541015625, -0.005279541015625, -0.004756927490234375, -0.00423431396484375, -0.003711700439453125, -0.0031890869140625, -0.002666473388671875, -0.00214385986328125, -0.001621246337890625, -0.0010986328125, -0.000576019287109375, -5.340576171875e-05, 0.000469207763671875, 0.0009918212890625, 0.001514434814453125, 0.00203704833984375, 0.002559661865234375, 0.003082275390625, 0.003604888916015625, 0.00412750244140625, 0.004650115966796875, 0.0051727294921875, 0.005695343017578125, 0.00621795654296875, 0.006740570068359375, 0.00726318359375, 0.007785797119140625, 0.00830841064453125, 0.008831024169921875, 0.0093536376953125, 0.009876251220703125, 0.01039886474609375, 0.010921478271484375, 0.011444091796875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 18.0, 19.0, 23.0, 33.0, 38.0, 62.0, 127.0, 157.0, 304.0, 672.0, 1794.0, 6164.0, 29341.0, 291572.0, 3721948.0, 118096.0, 17347.0, 4018.0, 1337.0, 532.0, 236.0, 126.0, 85.0, 55.0, 39.0, 37.0, 22.0, 19.0, 11.0, 10.0, 11.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005519866943359375, -0.005337953567504883, -0.005156040191650391, -0.0049741268157958984, -0.004792213439941406, -0.004610300064086914, -0.004428386688232422, -0.00424647331237793, -0.0040645599365234375, -0.0038826465606689453, -0.003700733184814453, -0.003518819808959961, -0.0033369064331054688, -0.0031549930572509766, -0.0029730796813964844, -0.002791166305541992, -0.0026092529296875, -0.002427339553833008, -0.0022454261779785156, -0.0020635128021240234, -0.0018815994262695312, -0.001699686050415039, -0.0015177726745605469, -0.0013358592987060547, -0.0011539459228515625, -0.0009720325469970703, -0.0007901191711425781, -0.0006082057952880859, -0.00042629241943359375, -0.00024437904357910156, -6.246566772460938e-05, 0.00011944770812988281, 0.000301361083984375, 0.0004832744598388672, 0.0006651878356933594, 0.0008471012115478516, 0.0010290145874023438, 0.001210927963256836, 0.0013928413391113281, 0.0015747547149658203, 0.0017566680908203125, 0.0019385814666748047, 0.002120494842529297, 0.002302408218383789, 0.0024843215942382812, 0.0026662349700927734, 0.0028481483459472656, 0.003030061721801758, 0.00321197509765625, 0.003393888473510742, 0.0035758018493652344, 0.0037577152252197266, 0.003939628601074219, 0.004121541976928711, 0.004303455352783203, 0.004485368728637695, 0.0046672821044921875, 0.00484919548034668, 0.005031108856201172, 0.005213022232055664, 0.005394935607910156, 0.0055768489837646484, 0.005758762359619141, 0.005940675735473633, 0.006122589111328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 2.0, 0.0, 5.0, 9.0, 12.0, 15.0, 19.0, 33.0, 57.0, 84.0, 218.0, 767.0, 1762.0, 633.0, 194.0, 81.0, 60.0, 41.0, 26.0, 19.0, 11.0, 7.0, 11.0, 5.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.003185272216796875, -0.0030295848846435547, -0.0028738975524902344, -0.002718210220336914, -0.0025625228881835938, -0.0024068355560302734, -0.002251148223876953, -0.002095460891723633, -0.0019397735595703125, -0.0017840862274169922, -0.0016283988952636719, -0.0014727115631103516, -0.0013170242309570312, -0.001161336898803711, -0.0010056495666503906, -0.0008499622344970703, -0.00069427490234375, -0.0005385875701904297, -0.0003829002380371094, -0.00022721290588378906, -7.152557373046875e-05, 8.416175842285156e-05, 0.00023984909057617188, 0.0003955364227294922, 0.0005512237548828125, 0.0007069110870361328, 0.0008625984191894531, 0.0010182857513427734, 0.0011739730834960938, 0.001329660415649414, 0.0014853477478027344, 0.0016410350799560547, 0.001796722412109375, 0.0019524097442626953, 0.0021080970764160156, 0.002263784408569336, 0.0024194717407226562, 0.0025751590728759766, 0.002730846405029297, 0.002886533737182617, 0.0030422210693359375, 0.003197908401489258, 0.003353595733642578, 0.0035092830657958984, 0.0036649703979492188, 0.003820657730102539, 0.003976345062255859, 0.00413203239440918, 0.0042877197265625, 0.00444340705871582, 0.004599094390869141, 0.004754781723022461, 0.004910469055175781, 0.0050661563873291016, 0.005221843719482422, 0.005377531051635742, 0.0055332183837890625, 0.005688905715942383, 0.005844593048095703, 0.0060002803802490234, 0.006155967712402344, 0.006311655044555664, 0.006467342376708984, 0.006623029708862305, 0.006778717041015625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 24.0, 95.0, 326.0, 361.0, 130.0, 41.0, 16.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022929366677999496, -0.021781951189041138, -0.02063453570008278, -0.01948712021112442, -0.01833970472216606, -0.017192289233207703, -0.016044875606894493, -0.014897460117936134, -0.013750044628977776, -0.012602629140019417, -0.011455213651061058, -0.010307799093425274, -0.009160383604466915, -0.008012968115508556, -0.006865553092211485, -0.0057181380689144135, -0.004570722579956055, -0.0034233073238283396, -0.0022758920677006245, -0.0011284768115729094, 1.8938444554805756e-05, 0.0011663539335131645, 0.002313768956810236, 0.0034611839801073074, 0.004608599469065666, 0.005756014958024025, 0.006903429981321096, 0.008050845004618168, 0.009198260493576527, 0.010345675982534885, 0.01149309054017067, 0.012640506029129028, 0.013787917792797089, 0.014935333281755447, 0.016082748770713806, 0.017230164259672165, 0.018377579748630524, 0.019524995237588882, 0.020672408863902092, 0.02181982435286045, 0.02296723984181881, 0.02411465533077717, 0.025262070819735527, 0.026409486308693886, 0.027556899935007095, 0.028704315423965454, 0.029851730912923813, 0.03099914640188217, 0.03214656189084053, 0.03329397737979889, 0.03444139286875725, 0.03558880835771561, 0.036736223846673965, 0.037883639335632324, 0.03903105482459068, 0.04017847031354904, 0.0413258820772171, 0.04247329756617546, 0.04362071305513382, 0.04476812854409218, 0.04591554403305054, 0.047062959522008896, 0.048210375010967255, 0.049357786774635315, 0.05050520598888397]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 4.0, 4.0, 7.0, 7.0, 9.0, 12.0, 14.0, 16.0, 13.0, 28.0, 35.0, 28.0, 33.0, 23.0, 38.0, 39.0, 35.0, 48.0, 51.0, 46.0, 32.0, 51.0, 46.0, 45.0, 33.0, 38.0, 29.0, 33.0, 27.0, 26.0, 23.0, 31.0, 12.0, 14.0, 14.0, 14.0, 8.0, 7.0, 8.0, 2.0, 6.0, 7.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.008240103721618652, -0.007956666871905327, -0.007673230022192001, -0.007389793172478676, -0.00710635632276535, -0.006822919473052025, -0.006539482623338699, -0.006256045773625374, -0.005972608923912048, -0.005689172074198723, -0.005405735224485397, -0.005122298374772072, -0.004838861525058746, -0.004555424675345421, -0.004271987825632095, -0.00398855097591877, -0.0037051141262054443, -0.003421677276492119, -0.0031382404267787933, -0.002854803577065468, -0.0025713667273521423, -0.002287929877638817, -0.0020044930279254913, -0.0017210561782121658, -0.0014376193284988403, -0.0011541824787855148, -0.0008707456290721893, -0.0005873087793588638, -0.00030387192964553833, -2.043507993221283e-05, 0.00026300176978111267, 0.0005464386194944382, 0.0008298754692077637, 0.0011133123189210892, 0.0013967491686344147, 0.0016801860183477402, 0.0019636228680610657, 0.002247059717774391, 0.0025304965674877167, 0.002813933417201042, 0.0030973702669143677, 0.003380807116627693, 0.0036642439663410187, 0.003947680816054344, 0.00423111766576767, 0.004514554515480995, 0.004797991365194321, 0.005081428214907646, 0.005364865064620972, 0.005648301914334297, 0.005931738764047623, 0.006215175613760948, 0.006498612463474274, 0.006782049313187599, 0.007065486162900925, 0.00734892301261425, 0.007632359862327576, 0.007915796712040901, 0.008199233561754227, 0.008482670411467552, 0.008766107261180878, 0.009049544110894203, 0.009332980960607529, 0.009616417810320854, 0.00989985466003418]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 5.0, 4.0, 8.0, 12.0, 18.0, 18.0, 29.0, 44.0, 54.0, 73.0, 131.0, 141.0, 244.0, 369.0, 626.0, 1124.0, 4424.0, 81172.0, 902611.0, 50985.0, 3675.0, 1079.0, 598.0, 339.0, 255.0, 140.0, 92.0, 68.0, 65.0, 35.0, 31.0, 26.0, 12.0, 9.0, 9.0, 8.0, 6.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 3.0], "bins": [-0.0218353271484375, -0.021267294883728027, -0.020699262619018555, -0.020131230354309082, -0.01956319808959961, -0.018995165824890137, -0.018427133560180664, -0.01785910129547119, -0.01729106903076172, -0.016723036766052246, -0.016155004501342773, -0.0155869722366333, -0.015018939971923828, -0.014450907707214355, -0.013882875442504883, -0.01331484317779541, -0.012746810913085938, -0.012178778648376465, -0.011610746383666992, -0.01104271411895752, -0.010474681854248047, -0.009906649589538574, -0.009338617324829102, -0.008770585060119629, -0.008202552795410156, -0.007634520530700684, -0.007066488265991211, -0.006498456001281738, -0.005930423736572266, -0.005362391471862793, -0.00479435920715332, -0.004226326942443848, -0.003658294677734375, -0.0030902624130249023, -0.0025222301483154297, -0.001954197883605957, -0.0013861656188964844, -0.0008181333541870117, -0.00025010108947753906, 0.0003179311752319336, 0.0008859634399414062, 0.001453995704650879, 0.0020220279693603516, 0.0025900602340698242, 0.003158092498779297, 0.0037261247634887695, 0.004294157028198242, 0.004862189292907715, 0.0054302215576171875, 0.00599825382232666, 0.006566286087036133, 0.0071343183517456055, 0.007702350616455078, 0.00827038288116455, 0.008838415145874023, 0.009406447410583496, 0.009974479675292969, 0.010542511940002441, 0.011110544204711914, 0.011678576469421387, 0.01224660873413086, 0.012814640998840332, 0.013382673263549805, 0.013950705528259277, 0.01451873779296875]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 26.0, 146.0, 388.0, 306.0, 121.0, 17.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0228424072265625, -0.02230978012084961, -0.02177715301513672, -0.021244525909423828, -0.020711898803710938, -0.020179271697998047, -0.019646644592285156, -0.019114017486572266, -0.018581390380859375, -0.018048763275146484, -0.017516136169433594, -0.016983509063720703, -0.016450881958007812, -0.015918254852294922, -0.015385627746582031, -0.01485300064086914, -0.01432037353515625, -0.01378774642944336, -0.013255119323730469, -0.012722492218017578, -0.012189865112304688, -0.011657238006591797, -0.011124610900878906, -0.010591983795166016, -0.010059356689453125, -0.009526729583740234, -0.008994102478027344, -0.008461475372314453, -0.007928848266601562, -0.007396221160888672, -0.006863594055175781, -0.006330966949462891, -0.00579833984375, -0.005265712738037109, -0.004733085632324219, -0.004200458526611328, -0.0036678314208984375, -0.003135204315185547, -0.0026025772094726562, -0.0020699501037597656, -0.001537322998046875, -0.0010046958923339844, -0.00047206878662109375, 6.0558319091796875e-05, 0.0005931854248046875, 0.0011258125305175781, 0.0016584396362304688, 0.0021910667419433594, 0.00272369384765625, 0.0032563209533691406, 0.0037889480590820312, 0.004321575164794922, 0.0048542022705078125, 0.005386829376220703, 0.005919456481933594, 0.006452083587646484, 0.006984710693359375, 0.007517337799072266, 0.008049964904785156, 0.008582592010498047, 0.009115219116210938, 0.009647846221923828, 0.010180473327636719, 0.01071310043334961, 0.0112457275390625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 7.0, 5.0, 8.0, 8.0, 19.0, 23.0, 37.0, 38.0, 45.0, 65.0, 95.0, 115.0, 191.0, 259.0, 389.0, 687.0, 1201.0, 2477.0, 5664.0, 15226.0, 46995.0, 164977.0, 419182.0, 272438.0, 79240.0, 23524.0, 8163.0, 3371.0, 1647.0, 858.0, 531.0, 317.0, 187.0, 145.0, 114.0, 82.0, 53.0, 44.0, 28.0, 20.0, 23.0, 12.0, 10.0, 10.0, 6.0, 8.0, 5.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.004901885986328125, -0.004742264747619629, -0.004582643508911133, -0.004423022270202637, -0.004263401031494141, -0.0041037797927856445, -0.0039441585540771484, -0.0037845373153686523, -0.0036249160766601562, -0.00346529483795166, -0.003305673599243164, -0.003146052360534668, -0.002986431121826172, -0.0028268098831176758, -0.0026671886444091797, -0.0025075674057006836, -0.0023479461669921875, -0.0021883249282836914, -0.0020287036895751953, -0.0018690824508666992, -0.0017094612121582031, -0.001549839973449707, -0.001390218734741211, -0.0012305974960327148, -0.0010709762573242188, -0.0009113550186157227, -0.0007517337799072266, -0.0005921125411987305, -0.0004324913024902344, -0.0002728700637817383, -0.00011324882507324219, 4.6372413635253906e-05, 0.00020599365234375, 0.0003656148910522461, 0.0005252361297607422, 0.0006848573684692383, 0.0008444786071777344, 0.0010040998458862305, 0.0011637210845947266, 0.0013233423233032227, 0.0014829635620117188, 0.0016425848007202148, 0.001802206039428711, 0.001961827278137207, 0.002121448516845703, 0.0022810697555541992, 0.0024406909942626953, 0.0026003122329711914, 0.0027599334716796875, 0.0029195547103881836, 0.0030791759490966797, 0.0032387971878051758, 0.003398418426513672, 0.003558039665222168, 0.003717660903930664, 0.00387728214263916, 0.004036903381347656, 0.004196524620056152, 0.0043561458587646484, 0.0045157670974731445, 0.004675388336181641, 0.004835009574890137, 0.004994630813598633, 0.005154252052307129, 0.005313873291015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 7.0, 10.0, 13.0, 26.0, 23.0, 22.0, 36.0, 21.0, 34.0, 38.0, 47.0, 48.0, 53.0, 62.0, 58.0, 59.0, 52.0, 48.0, 53.0, 40.0, 32.0, 38.0, 28.0, 20.0, 25.0, 13.0, 18.0, 17.0, 11.0, 14.0, 5.0, 5.0, 6.0, 5.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006908416748046875, -0.006679356098175049, -0.006450295448303223, -0.0062212347984313965, -0.00599217414855957, -0.005763113498687744, -0.005534052848815918, -0.005304992198944092, -0.005075931549072266, -0.0048468708992004395, -0.004617810249328613, -0.004388749599456787, -0.004159688949584961, -0.003930628299713135, -0.0037015676498413086, -0.0034725069999694824, -0.0032434463500976562, -0.00301438570022583, -0.002785325050354004, -0.0025562644004821777, -0.0023272037506103516, -0.0020981431007385254, -0.0018690824508666992, -0.001640021800994873, -0.0014109611511230469, -0.0011819005012512207, -0.0009528398513793945, -0.0007237792015075684, -0.0004947185516357422, -0.000265657901763916, -3.6597251892089844e-05, 0.00019246339797973633, 0.0004215240478515625, 0.0006505846977233887, 0.0008796453475952148, 0.001108705997467041, 0.0013377666473388672, 0.0015668272972106934, 0.0017958879470825195, 0.0020249485969543457, 0.002254009246826172, 0.002483069896697998, 0.0027121305465698242, 0.0029411911964416504, 0.0031702518463134766, 0.0033993124961853027, 0.003628373146057129, 0.003857433795928955, 0.004086494445800781, 0.004315555095672607, 0.004544615745544434, 0.00477367639541626, 0.005002737045288086, 0.005231797695159912, 0.005460858345031738, 0.0056899189949035645, 0.005918979644775391, 0.006148040294647217, 0.006377100944519043, 0.006606161594390869, 0.006835222244262695, 0.0070642828941345215, 0.007293343544006348, 0.007522404193878174, 0.00775146484375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 13.0, 13.0, 18.0, 19.0, 24.0, 39.0, 63.0, 81.0, 143.0, 209.0, 317.0, 498.0, 867.0, 1757.0, 3651.0, 9250.0, 28469.0, 126284.0, 626336.0, 191142.0, 38746.0, 11515.0, 4428.0, 2005.0, 1011.0, 552.0, 375.0, 230.0, 148.0, 118.0, 60.0, 39.0, 29.0, 17.0, 20.0, 24.0, 14.0, 8.0, 4.0, 0.0, 3.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00301361083984375, -0.0029151737689971924, -0.0028167366981506348, -0.002718299627304077, -0.0026198625564575195, -0.002521425485610962, -0.0024229884147644043, -0.0023245513439178467, -0.002226114273071289, -0.0021276772022247314, -0.002029240131378174, -0.0019308030605316162, -0.0018323659896850586, -0.001733928918838501, -0.0016354918479919434, -0.0015370547771453857, -0.0014386177062988281, -0.0013401806354522705, -0.0012417435646057129, -0.0011433064937591553, -0.0010448694229125977, -0.00094643235206604, -0.0008479952812194824, -0.0007495582103729248, -0.0006511211395263672, -0.0005526840686798096, -0.00045424699783325195, -0.00035580992698669434, -0.0002573728561401367, -0.0001589357852935791, -6.0498714447021484e-05, 3.793835639953613e-05, 0.00013637542724609375, 0.00023481249809265137, 0.000333249568939209, 0.0004316866397857666, 0.0005301237106323242, 0.0006285607814788818, 0.0007269978523254395, 0.0008254349231719971, 0.0009238719940185547, 0.0010223090648651123, 0.00112074613571167, 0.0012191832065582275, 0.0013176202774047852, 0.0014160573482513428, 0.0015144944190979004, 0.001612931489944458, 0.0017113685607910156, 0.0018098056316375732, 0.0019082427024841309, 0.0020066797733306885, 0.002105116844177246, 0.0022035539150238037, 0.0023019909858703613, 0.002400428056716919, 0.0024988651275634766, 0.002597302198410034, 0.002695739269256592, 0.0027941763401031494, 0.002892613410949707, 0.0029910504817962646, 0.0030894875526428223, 0.00318792462348938, 0.0032863616943359375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 3.0, 4.0, 6.0, 2.0, 10.0, 7.0, 8.0, 17.0, 17.0, 14.0, 33.0, 31.0, 39.0, 45.0, 63.0, 63.0, 110.0, 76.0, 70.0, 73.0, 67.0, 46.0, 31.0, 39.0, 22.0, 16.0, 17.0, 10.0, 6.0, 11.0, 4.0, 4.0, 10.0, 9.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.231401443481445e-05, -8.011888712644577e-05, -7.792375981807709e-05, -7.57286325097084e-05, -7.353350520133972e-05, -7.133837789297104e-05, -6.914325058460236e-05, -6.694812327623367e-05, -6.475299596786499e-05, -6.255786865949631e-05, -6.0362741351127625e-05, -5.816761404275894e-05, -5.597248673439026e-05, -5.3777359426021576e-05, -5.158223211765289e-05, -4.938710480928421e-05, -4.719197750091553e-05, -4.4996850192546844e-05, -4.280172288417816e-05, -4.060659557580948e-05, -3.8411468267440796e-05, -3.621634095907211e-05, -3.402121365070343e-05, -3.182608634233475e-05, -2.9630959033966064e-05, -2.743583172559738e-05, -2.52407044172287e-05, -2.3045577108860016e-05, -2.0850449800491333e-05, -1.865532249212265e-05, -1.6460195183753967e-05, -1.4265067875385284e-05, -1.2069940567016602e-05, -9.874813258647919e-06, -7.679685950279236e-06, -5.484558641910553e-06, -3.28943133354187e-06, -1.0943040251731873e-06, 1.1008232831954956e-06, 3.2959505915641785e-06, 5.491077899932861e-06, 7.686205208301544e-06, 9.881332516670227e-06, 1.207645982503891e-05, 1.4271587133407593e-05, 1.6466714441776276e-05, 1.866184175014496e-05, 2.085696905851364e-05, 2.3052096366882324e-05, 2.5247223675251007e-05, 2.744235098361969e-05, 2.9637478291988373e-05, 3.1832605600357056e-05, 3.402773290872574e-05, 3.622286021709442e-05, 3.8417987525463104e-05, 4.061311483383179e-05, 4.280824214220047e-05, 4.500336945056915e-05, 4.7198496758937836e-05, 4.939362406730652e-05, 5.15887513756752e-05, 5.3783878684043884e-05, 5.597900599241257e-05, 5.817413330078125e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 1.0, 8.0, 7.0, 6.0, 13.0, 20.0, 17.0, 34.0, 51.0, 75.0, 124.0, 159.0, 275.0, 444.0, 833.0, 1536.0, 2988.0, 6361.0, 15062.0, 39603.0, 132141.0, 535323.0, 219344.0, 56969.0, 20546.0, 8441.0, 3779.0, 1908.0, 951.0, 576.0, 316.0, 193.0, 137.0, 82.0, 59.0, 45.0, 21.0, 32.0, 16.0, 16.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0], "bins": [-0.002658843994140625, -0.0025798678398132324, -0.00250089168548584, -0.0024219155311584473, -0.0023429393768310547, -0.002263963222503662, -0.0021849870681762695, -0.002106010913848877, -0.0020270347595214844, -0.0019480586051940918, -0.0018690824508666992, -0.0017901062965393066, -0.001711130142211914, -0.0016321539878845215, -0.001553177833557129, -0.0014742016792297363, -0.0013952255249023438, -0.0013162493705749512, -0.0012372732162475586, -0.001158297061920166, -0.0010793209075927734, -0.0010003447532653809, -0.0009213685989379883, -0.0008423924446105957, -0.0007634162902832031, -0.0006844401359558105, -0.000605463981628418, -0.0005264878273010254, -0.0004475116729736328, -0.00036853551864624023, -0.00028955936431884766, -0.00021058320999145508, -0.0001316070556640625, -5.263090133666992e-05, 2.6345252990722656e-05, 0.00010532140731811523, 0.0001842975616455078, 0.0002632737159729004, 0.00034224987030029297, 0.00042122602462768555, 0.0005002021789550781, 0.0005791783332824707, 0.0006581544876098633, 0.0007371306419372559, 0.0008161067962646484, 0.000895082950592041, 0.0009740591049194336, 0.0010530352592468262, 0.0011320114135742188, 0.0012109875679016113, 0.001289963722229004, 0.0013689398765563965, 0.001447916030883789, 0.0015268921852111816, 0.0016058683395385742, 0.0016848444938659668, 0.0017638206481933594, 0.001842796802520752, 0.0019217729568481445, 0.002000749111175537, 0.0020797252655029297, 0.0021587014198303223, 0.002237677574157715, 0.0023166537284851074, 0.0023956298828125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 9.0, 11.0, 21.0, 12.0, 18.0, 20.0, 18.0, 27.0, 30.0, 36.0, 46.0, 104.0, 119.0, 136.0, 90.0, 57.0, 41.0, 34.0, 30.0, 25.0, 21.0, 15.0, 12.0, 12.0, 10.0, 5.0, 5.0, 7.0, 6.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002979278564453125, -0.0028944015502929688, -0.0028095245361328125, -0.0027246475219726562, -0.0026397705078125, -0.0025548934936523438, -0.0024700164794921875, -0.0023851394653320312, -0.002300262451171875, -0.0022153854370117188, -0.0021305084228515625, -0.0020456314086914062, -0.00196075439453125, -0.0018758773803710938, -0.0017910003662109375, -0.0017061233520507812, -0.001621246337890625, -0.0015363693237304688, -0.0014514923095703125, -0.0013666152954101562, -0.00128173828125, -0.0011968612670898438, -0.0011119842529296875, -0.0010271072387695312, -0.000942230224609375, -0.0008573532104492188, -0.0007724761962890625, -0.0006875991821289062, -0.00060272216796875, -0.0005178451538085938, -0.0004329681396484375, -0.00034809112548828125, -0.000263214111328125, -0.00017833709716796875, -9.34600830078125e-05, -8.58306884765625e-06, 7.62939453125e-05, 0.00016117095947265625, 0.0002460479736328125, 0.00033092498779296875, 0.000415802001953125, 0.0005006790161132812, 0.0005855560302734375, 0.0006704330444335938, 0.00075531005859375, 0.0008401870727539062, 0.0009250640869140625, 0.0010099411010742188, 0.001094818115234375, 0.0011796951293945312, 0.0012645721435546875, 0.0013494491577148438, 0.001434326171875, 0.0015192031860351562, 0.0016040802001953125, 0.0016889572143554688, 0.001773834228515625, 0.0018587112426757812, 0.0019435882568359375, 0.0020284652709960938, 0.00211334228515625, 0.0021982192993164062, 0.0022830963134765625, 0.0023679733276367188, 0.002452850341796875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 7.0, 84.0, 911.0, 12.0, 3.0], "bins": [-0.7076512575149536, -0.6961158514022827, -0.6845804452896118, -0.6730450987815857, -0.6615096926689148, -0.6499742865562439, -0.6384389400482178, -0.6269035339355469, -0.615368127822876, -0.6038327217102051, -0.5922973155975342, -0.5807619690895081, -0.5692265629768372, -0.5576911568641663, -0.5461558103561401, -0.5346204042434692, -0.5230849981307983, -0.5115495920181274, -0.5000141859054565, -0.4884788393974304, -0.4769434332847595, -0.4654080271720886, -0.4538726508617401, -0.4423372745513916, -0.4308018684387207, -0.4192664623260498, -0.4077310860157013, -0.3961957097053528, -0.3846603035926819, -0.373124897480011, -0.3615895211696625, -0.35005414485931396, -0.33851873874664307, -0.32698333263397217, -0.31544795632362366, -0.30391258001327515, -0.29237717390060425, -0.28084176778793335, -0.26930639147758484, -0.25777101516723633, -0.24623560905456543, -0.23470021784305573, -0.22316482663154602, -0.21162943542003632, -0.2000940442085266, -0.1885586529970169, -0.1770232617855072, -0.1654878705739975, -0.1539524793624878, -0.1424170881509781, -0.13088169693946838, -0.11934630572795868, -0.10781091451644897, -0.09627552330493927, -0.08474013209342957, -0.07320474088191986, -0.06166935712099075, -0.05013396590948105, -0.038598574697971344, -0.02706318348646164, -0.015527792274951935, -0.00399240106344223, 0.007542990148067474, 0.01907838135957718, 0.030613774433732033]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 7.0, 10.0, 15.0, 15.0, 16.0, 14.0, 31.0, 36.0, 29.0, 40.0, 30.0, 46.0, 35.0, 56.0, 50.0, 49.0, 55.0, 49.0, 40.0, 50.0, 40.0, 40.0, 35.0, 43.0, 37.0, 28.0, 18.0, 24.0, 18.0, 16.0, 7.0, 12.0, 3.0, 2.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01630920171737671, -0.015610375441610813, -0.014911549165844917, -0.014212722890079021, -0.013513896614313126, -0.01281507033854723, -0.012116244062781334, -0.011417417787015438, -0.010718591511249542, -0.010019765235483646, -0.00932093895971775, -0.008622112683951855, -0.007923286408185959, -0.007224460132420063, -0.006525633856654167, -0.005826807580888271, -0.0051279813051223755, -0.00442915502935648, -0.003730328753590584, -0.003031502477824688, -0.002332676202058792, -0.0016338499262928963, -0.0009350236505270004, -0.00023619737476110458, 0.00046262890100479126, 0.001161455176770687, 0.001860281452536583, 0.002559107728302479, 0.0032579340040683746, 0.0039567602798342705, 0.004655586555600166, 0.005354412831366062, 0.006053239107131958, 0.006752065382897854, 0.00745089165866375, 0.008149717934429646, 0.008848544210195541, 0.009547370485961437, 0.010246196761727333, 0.010945023037493229, 0.011643849313259125, 0.01234267558902502, 0.013041501864790916, 0.013740328140556812, 0.014439154416322708, 0.015137980692088604, 0.0158368069678545, 0.01653563231229782, 0.01723445951938629, 0.017933286726474762, 0.018632112070918083, 0.019330937415361404, 0.020029764622449875, 0.020728591829538345, 0.021427417173981667, 0.022126242518424988, 0.022825069725513458, 0.02352389693260193, 0.02422272227704525, 0.02492154762148857, 0.02562037482857704, 0.026319202035665512, 0.027018027380108833, 0.027716852724552155, 0.028415679931640625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 9.0, 2.0, 9.0, 7.0, 8.0, 9.0, 14.0, 21.0, 40.0, 46.0, 75.0, 128.0, 144.0, 329.0, 1621.0, 6127.0, 177861.0, 3985937.0, 16972.0, 2787.0, 964.0, 545.0, 364.0, 157.0, 38.0, 20.0, 12.0, 12.0, 9.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0187530517578125, -0.01822078227996826, -0.017688512802124023, -0.017156243324279785, -0.016623973846435547, -0.01609170436859131, -0.01555943489074707, -0.015027165412902832, -0.014494895935058594, -0.013962626457214355, -0.013430356979370117, -0.012898087501525879, -0.01236581802368164, -0.011833548545837402, -0.011301279067993164, -0.010769009590148926, -0.010236740112304688, -0.00970447063446045, -0.009172201156616211, -0.008639931678771973, -0.008107662200927734, -0.007575392723083496, -0.007043123245239258, -0.0065108537673950195, -0.005978584289550781, -0.005446314811706543, -0.004914045333862305, -0.004381775856018066, -0.003849506378173828, -0.00331723690032959, -0.0027849674224853516, -0.0022526979446411133, -0.001720428466796875, -0.0011881589889526367, -0.0006558895111083984, -0.00012362003326416016, 0.0004086494445800781, 0.0009409189224243164, 0.0014731884002685547, 0.002005457878112793, 0.0025377273559570312, 0.0030699968338012695, 0.003602266311645508, 0.004134535789489746, 0.004666805267333984, 0.005199074745178223, 0.005731344223022461, 0.006263613700866699, 0.0067958831787109375, 0.007328152656555176, 0.007860422134399414, 0.008392691612243652, 0.00892496109008789, 0.009457230567932129, 0.009989500045776367, 0.010521769523620605, 0.011054039001464844, 0.011586308479309082, 0.01211857795715332, 0.012650847434997559, 0.013183116912841797, 0.013715386390686035, 0.014247655868530273, 0.014779925346374512, 0.01531219482421875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 11.0, 75.0, 234.0, 399.0, 220.0, 65.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0221405029296875, -0.02161872386932373, -0.02109694480895996, -0.02057516574859619, -0.020053386688232422, -0.019531607627868652, -0.019009828567504883, -0.018488049507141113, -0.017966270446777344, -0.017444491386413574, -0.016922712326049805, -0.016400933265686035, -0.015879154205322266, -0.015357375144958496, -0.014835596084594727, -0.014313817024230957, -0.013792037963867188, -0.013270258903503418, -0.012748479843139648, -0.012226700782775879, -0.01170492172241211, -0.01118314266204834, -0.01066136360168457, -0.0101395845413208, -0.009617805480957031, -0.009096026420593262, -0.008574247360229492, -0.008052468299865723, -0.007530689239501953, -0.007008910179138184, -0.006487131118774414, -0.0059653520584106445, -0.005443572998046875, -0.0049217939376831055, -0.004400014877319336, -0.0038782358169555664, -0.003356456756591797, -0.0028346776962280273, -0.002312898635864258, -0.0017911195755004883, -0.0012693405151367188, -0.0007475614547729492, -0.0002257823944091797, 0.00029599666595458984, 0.0008177757263183594, 0.001339554786682129, 0.0018613338470458984, 0.002383112907409668, 0.0029048919677734375, 0.003426671028137207, 0.0039484500885009766, 0.004470229148864746, 0.004992008209228516, 0.005513787269592285, 0.006035566329956055, 0.006557345390319824, 0.007079124450683594, 0.007600903511047363, 0.008122682571411133, 0.008644461631774902, 0.009166240692138672, 0.009688019752502441, 0.010209798812866211, 0.01073157787322998, 0.01125335693359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 4.0, 5.0, 14.0, 25.0, 25.0, 47.0, 73.0, 136.0, 214.0, 362.0, 628.0, 1131.0, 2450.0, 5804.0, 16597.0, 62233.0, 432604.0, 3391249.0, 216797.0, 42435.0, 12577.0, 4465.0, 1979.0, 1039.0, 584.0, 283.0, 179.0, 121.0, 68.0, 55.0, 31.0, 20.0, 12.0, 14.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.0046539306640625, -0.0045185089111328125, -0.004383087158203125, -0.0042476654052734375, -0.00411224365234375, -0.0039768218994140625, -0.003841400146484375, -0.0037059783935546875, -0.003570556640625, -0.0034351348876953125, -0.003299713134765625, -0.0031642913818359375, -0.00302886962890625, -0.0028934478759765625, -0.002758026123046875, -0.0026226043701171875, -0.0024871826171875, -0.0023517608642578125, -0.002216339111328125, -0.0020809173583984375, -0.00194549560546875, -0.0018100738525390625, -0.001674652099609375, -0.0015392303466796875, -0.00140380859375, -0.0012683868408203125, -0.001132965087890625, -0.0009975433349609375, -0.00086212158203125, -0.0007266998291015625, -0.000591278076171875, -0.0004558563232421875, -0.0003204345703125, -0.0001850128173828125, -4.9591064453125e-05, 8.58306884765625e-05, 0.00022125244140625, 0.0003566741943359375, 0.000492095947265625, 0.0006275177001953125, 0.000762939453125, 0.0008983612060546875, 0.001033782958984375, 0.0011692047119140625, 0.00130462646484375, 0.0014400482177734375, 0.001575469970703125, 0.0017108917236328125, 0.0018463134765625, 0.0019817352294921875, 0.002117156982421875, 0.0022525787353515625, 0.00238800048828125, 0.0025234222412109375, 0.002658843994140625, 0.0027942657470703125, 0.0029296875, 0.0030651092529296875, 0.003200531005859375, 0.0033359527587890625, 0.00347137451171875, 0.0036067962646484375, 0.003742218017578125, 0.0038776397705078125, 0.0040130615234375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 11.0, 11.0, 11.0, 22.0, 31.0, 46.0, 83.0, 152.0, 467.0, 1291.0, 1157.0, 382.0, 136.0, 89.0, 63.0, 36.0, 26.0, 17.0, 16.0, 7.0, 4.0, 8.0, 1.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00409698486328125, -0.003939449787139893, -0.003781914710998535, -0.0036243796348571777, -0.0034668445587158203, -0.003309309482574463, -0.0031517744064331055, -0.002994239330291748, -0.0028367042541503906, -0.002679169178009033, -0.0025216341018676758, -0.0023640990257263184, -0.002206563949584961, -0.0020490288734436035, -0.001891493797302246, -0.0017339587211608887, -0.0015764236450195312, -0.0014188885688781738, -0.0012613534927368164, -0.001103818416595459, -0.0009462833404541016, -0.0007887482643127441, -0.0006312131881713867, -0.0004736781120300293, -0.0003161430358886719, -0.00015860795974731445, -1.0728836059570312e-06, 0.0001564621925354004, 0.0003139972686767578, 0.00047153234481811523, 0.0006290674209594727, 0.0007866024971008301, 0.0009441375732421875, 0.001101672649383545, 0.0012592077255249023, 0.0014167428016662598, 0.0015742778778076172, 0.0017318129539489746, 0.001889348030090332, 0.0020468831062316895, 0.002204418182373047, 0.0023619532585144043, 0.0025194883346557617, 0.002677023410797119, 0.0028345584869384766, 0.002992093563079834, 0.0031496286392211914, 0.003307163715362549, 0.0034646987915039062, 0.0036222338676452637, 0.003779768943786621, 0.0039373040199279785, 0.004094839096069336, 0.004252374172210693, 0.004409909248352051, 0.004567444324493408, 0.004724979400634766, 0.004882514476776123, 0.0050400495529174805, 0.005197584629058838, 0.005355119705200195, 0.005512654781341553, 0.00567018985748291, 0.005827724933624268, 0.005985260009765625]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 10.0, 56.0, 344.0, 475.0, 98.0, 20.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022165531292557716, -0.020169777795672417, -0.018174026161432266, -0.016178272664546967, -0.014182519167661667, -0.012186765670776367, -0.010191013105213642, -0.008195260539650917, -0.006199507042765617, -0.004203754011541605, -0.0022080009803175926, -0.00021224794909358025, 0.0017835050821304321, 0.003779258579015732, 0.005775011144578457, 0.007770763710141182, 0.009766517207026482, 0.011762270703911781, 0.013758023269474506, 0.01575377583503723, 0.01774952933192253, 0.01974528282880783, 0.02174103632569313, 0.02373678795993328, 0.02573254145681858, 0.02772829495370388, 0.02972404658794403, 0.03171980008482933, 0.03371555358171463, 0.03571130707859993, 0.03770706057548523, 0.03970281034708023, 0.04169856011867523, 0.04369431361556053, 0.04569006711244583, 0.04768582060933113, 0.04968157410621643, 0.05167732387781143, 0.05367307737469673, 0.05566883087158203, 0.05766458436846733, 0.05966033786535263, 0.06165609136223793, 0.06365184485912323, 0.06564759463071823, 0.06764335185289383, 0.06963910162448883, 0.07163485884666443, 0.07363060861825943, 0.07562635838985443, 0.07762211561203003, 0.07961786538362503, 0.08161362260580063, 0.08360937237739563, 0.08560512959957123, 0.08760087937116623, 0.08959662914276123, 0.09159237891435623, 0.09358813613653183, 0.09558388590812683, 0.09757964313030243, 0.09957539290189743, 0.10157115012407303, 0.10356689989566803, 0.10556265711784363]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 12.0, 11.0, 14.0, 15.0, 24.0, 23.0, 25.0, 30.0, 48.0, 49.0, 42.0, 45.0, 66.0, 44.0, 48.0, 41.0, 66.0, 58.0, 48.0, 42.0, 39.0, 41.0, 25.0, 33.0, 17.0, 14.0, 16.0, 8.0, 15.0, 11.0, 4.0, 3.0, 5.0, 2.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.013563811779022217, -0.013193903490900993, -0.01282399520277977, -0.012454086914658546, -0.012084178626537323, -0.0117142703384161, -0.011344362050294876, -0.010974453762173653, -0.01060454547405243, -0.010234637185931206, -0.009864728897809982, -0.009494820609688759, -0.009124912321567535, -0.008755004033446312, -0.008385095745325089, -0.008015187457203865, -0.007645279169082642, -0.007275370880961418, -0.006905462592840195, -0.006535554304718971, -0.006165646016597748, -0.005795737728476524, -0.005425829440355301, -0.0050559211522340775, -0.004686012864112854, -0.0043161045759916306, -0.003946196287870407, -0.0035762879997491837, -0.00320637971162796, -0.0028364714235067368, -0.0024665631353855133, -0.00209665484726429, -0.0017267465591430664, -0.001356838271021843, -0.0009869299829006195, -0.0006170216947793961, -0.0002471134066581726, 0.00012279488146305084, 0.0004927031695842743, 0.0008626114577054977, 0.0012325197458267212, 0.0016024280339479446, 0.001972336322069168, 0.0023422446101903915, 0.002712152898311615, 0.0030820611864328384, 0.003451969474554062, 0.0038218777626752853, 0.004191786050796509, 0.004561694338917732, 0.004931602627038956, 0.005301510915160179, 0.005671419203281403, 0.006041327491402626, 0.0064112357795238495, 0.006781144067645073, 0.007151052355766296, 0.00752096064388752, 0.007890868932008743, 0.008260777220129967, 0.00863068550825119, 0.009000593796372414, 0.009370502084493637, 0.00974041037261486, 0.010110318660736084]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 6.0, 7.0, 10.0, 10.0, 15.0, 24.0, 26.0, 29.0, 41.0, 64.0, 104.0, 156.0, 259.0, 437.0, 784.0, 1989.0, 18578.0, 903130.0, 116314.0, 4027.0, 1090.0, 563.0, 311.0, 186.0, 121.0, 62.0, 68.0, 39.0, 32.0, 12.0, 13.0, 9.0, 8.0, 6.0, 7.0, 3.0, 3.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0251007080078125, -0.024397850036621094, -0.023694992065429688, -0.02299213409423828, -0.022289276123046875, -0.02158641815185547, -0.020883560180664062, -0.020180702209472656, -0.01947784423828125, -0.018774986267089844, -0.018072128295898438, -0.01736927032470703, -0.016666412353515625, -0.01596355438232422, -0.015260696411132812, -0.014557838439941406, -0.01385498046875, -0.013152122497558594, -0.012449264526367188, -0.011746406555175781, -0.011043548583984375, -0.010340690612792969, -0.009637832641601562, -0.008934974670410156, -0.00823211669921875, -0.007529258728027344, -0.0068264007568359375, -0.006123542785644531, -0.005420684814453125, -0.004717826843261719, -0.0040149688720703125, -0.0033121109008789062, -0.0026092529296875, -0.0019063949584960938, -0.0012035369873046875, -0.0005006790161132812, 0.000202178955078125, 0.0009050369262695312, 0.0016078948974609375, 0.0023107528686523438, 0.00301361083984375, 0.0037164688110351562, 0.0044193267822265625, 0.005122184753417969, 0.005825042724609375, 0.006527900695800781, 0.0072307586669921875, 0.007933616638183594, 0.008636474609375, 0.009339332580566406, 0.010042190551757812, 0.010745048522949219, 0.011447906494140625, 0.012150764465332031, 0.012853622436523438, 0.013556480407714844, 0.01425933837890625, 0.014962196350097656, 0.015665054321289062, 0.01636791229248047, 0.017070770263671875, 0.01777362823486328, 0.018476486206054688, 0.019179344177246094, 0.0198822021484375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 5.0, 34.0, 176.0, 402.0, 282.0, 95.0, 13.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0224151611328125, -0.021890759468078613, -0.021366357803344727, -0.02084195613861084, -0.020317554473876953, -0.019793152809143066, -0.01926875114440918, -0.018744349479675293, -0.018219947814941406, -0.01769554615020752, -0.017171144485473633, -0.016646742820739746, -0.01612234115600586, -0.015597939491271973, -0.015073537826538086, -0.0145491361618042, -0.014024734497070312, -0.013500332832336426, -0.012975931167602539, -0.012451529502868652, -0.011927127838134766, -0.011402726173400879, -0.010878324508666992, -0.010353922843933105, -0.009829521179199219, -0.009305119514465332, -0.008780717849731445, -0.008256316184997559, -0.007731914520263672, -0.007207512855529785, -0.0066831111907958984, -0.006158709526062012, -0.005634307861328125, -0.005109906196594238, -0.0045855045318603516, -0.004061102867126465, -0.003536701202392578, -0.0030122995376586914, -0.0024878978729248047, -0.001963496208190918, -0.0014390945434570312, -0.0009146928787231445, -0.0003902912139892578, 0.0001341104507446289, 0.0006585121154785156, 0.0011829137802124023, 0.001707315444946289, 0.0022317171096801758, 0.0027561187744140625, 0.0032805204391479492, 0.003804922103881836, 0.004329323768615723, 0.004853725433349609, 0.005378127098083496, 0.005902528762817383, 0.0064269304275512695, 0.006951332092285156, 0.007475733757019043, 0.00800013542175293, 0.008524537086486816, 0.009048938751220703, 0.00957334041595459, 0.010097742080688477, 0.010622143745422363, 0.01114654541015625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 4.0, 1.0, 3.0, 9.0, 7.0, 10.0, 18.0, 31.0, 51.0, 51.0, 102.0, 152.0, 260.0, 472.0, 928.0, 2069.0, 5016.0, 15931.0, 75568.0, 409942.0, 430737.0, 80984.0, 16800.0, 5211.0, 2031.0, 1008.0, 488.0, 237.0, 153.0, 91.0, 60.0, 38.0, 25.0, 25.0, 14.0, 15.0, 5.0, 2.0, 3.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.007167816162109375, -0.006950736045837402, -0.00673365592956543, -0.006516575813293457, -0.006299495697021484, -0.006082415580749512, -0.005865335464477539, -0.005648255348205566, -0.005431175231933594, -0.005214095115661621, -0.0049970149993896484, -0.004779934883117676, -0.004562854766845703, -0.0043457746505737305, -0.004128694534301758, -0.003911614418029785, -0.0036945343017578125, -0.00347745418548584, -0.003260374069213867, -0.0030432939529418945, -0.002826213836669922, -0.0026091337203979492, -0.0023920536041259766, -0.002174973487854004, -0.0019578933715820312, -0.0017408132553100586, -0.001523733139038086, -0.0013066530227661133, -0.0010895729064941406, -0.000872492790222168, -0.0006554126739501953, -0.00043833255767822266, -0.00022125244140625, -4.172325134277344e-06, 0.0002129077911376953, 0.00042998790740966797, 0.0006470680236816406, 0.0008641481399536133, 0.001081228256225586, 0.0012983083724975586, 0.0015153884887695312, 0.001732468605041504, 0.0019495487213134766, 0.0021666288375854492, 0.002383708953857422, 0.0026007890701293945, 0.002817869186401367, 0.00303494930267334, 0.0032520294189453125, 0.003469109535217285, 0.003686189651489258, 0.0039032697677612305, 0.004120349884033203, 0.004337430000305176, 0.0045545101165771484, 0.004771590232849121, 0.004988670349121094, 0.005205750465393066, 0.005422830581665039, 0.005639910697937012, 0.005856990814208984, 0.006074070930480957, 0.00629115104675293, 0.006508231163024902, 0.006725311279296875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 5.0, 6.0, 8.0, 2.0, 3.0, 7.0, 8.0, 20.0, 27.0, 28.0, 42.0, 38.0, 41.0, 59.0, 62.0, 59.0, 58.0, 65.0, 57.0, 58.0, 55.0, 47.0, 51.0, 30.0, 31.0, 29.0, 16.0, 28.0, 18.0, 13.0, 7.0, 9.0, 3.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00814056396484375, -0.007881879806518555, -0.007623195648193359, -0.007364511489868164, -0.007105827331542969, -0.0068471431732177734, -0.006588459014892578, -0.006329774856567383, -0.0060710906982421875, -0.005812406539916992, -0.005553722381591797, -0.0052950382232666016, -0.005036354064941406, -0.004777669906616211, -0.004518985748291016, -0.00426030158996582, -0.004001617431640625, -0.0037429332733154297, -0.0034842491149902344, -0.003225564956665039, -0.0029668807983398438, -0.0027081966400146484, -0.002449512481689453, -0.002190828323364258, -0.0019321441650390625, -0.0016734600067138672, -0.0014147758483886719, -0.0011560916900634766, -0.0008974075317382812, -0.0006387233734130859, -0.0003800392150878906, -0.00012135505676269531, 0.0001373291015625, 0.0003960132598876953, 0.0006546974182128906, 0.0009133815765380859, 0.0011720657348632812, 0.0014307498931884766, 0.0016894340515136719, 0.0019481182098388672, 0.0022068023681640625, 0.002465486526489258, 0.002724170684814453, 0.0029828548431396484, 0.0032415390014648438, 0.003500223159790039, 0.0037589073181152344, 0.00401759147644043, 0.004276275634765625, 0.00453495979309082, 0.004793643951416016, 0.005052328109741211, 0.005311012268066406, 0.0055696964263916016, 0.005828380584716797, 0.006087064743041992, 0.0063457489013671875, 0.006604433059692383, 0.006863117218017578, 0.0071218013763427734, 0.007380485534667969, 0.007639169692993164, 0.00789785385131836, 0.008156538009643555, 0.00841522216796875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 4.0, 7.0, 6.0, 14.0, 15.0, 21.0, 30.0, 44.0, 51.0, 75.0, 91.0, 173.0, 246.0, 358.0, 543.0, 858.0, 1492.0, 2755.0, 5295.0, 11875.0, 40208.0, 312044.0, 576224.0, 65352.0, 16302.0, 6537.0, 3236.0, 1756.0, 1037.0, 607.0, 439.0, 260.0, 184.0, 110.0, 88.0, 66.0, 44.0, 21.0, 27.0, 19.0, 13.0, 12.0, 6.0, 5.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.004177093505859375, -0.0040471553802490234, -0.003917217254638672, -0.0037872791290283203, -0.0036573410034179688, -0.003527402877807617, -0.0033974647521972656, -0.003267526626586914, -0.0031375885009765625, -0.003007650375366211, -0.0028777122497558594, -0.002747774124145508, -0.0026178359985351562, -0.0024878978729248047, -0.002357959747314453, -0.0022280216217041016, -0.00209808349609375, -0.0019681453704833984, -0.0018382072448730469, -0.0017082691192626953, -0.0015783309936523438, -0.0014483928680419922, -0.0013184547424316406, -0.001188516616821289, -0.0010585784912109375, -0.0009286403656005859, -0.0007987022399902344, -0.0006687641143798828, -0.0005388259887695312, -0.0004088878631591797, -0.0002789497375488281, -0.00014901161193847656, -1.9073486328125e-05, 0.00011086463928222656, 0.00024080276489257812, 0.0003707408905029297, 0.0005006790161132812, 0.0006306171417236328, 0.0007605552673339844, 0.0008904933929443359, 0.0010204315185546875, 0.001150369644165039, 0.0012803077697753906, 0.0014102458953857422, 0.0015401840209960938, 0.0016701221466064453, 0.0018000602722167969, 0.0019299983978271484, 0.0020599365234375, 0.0021898746490478516, 0.002319812774658203, 0.0024497509002685547, 0.0025796890258789062, 0.002709627151489258, 0.0028395652770996094, 0.002969503402709961, 0.0030994415283203125, 0.003229379653930664, 0.0033593177795410156, 0.003489255905151367, 0.0036191940307617188, 0.0037491321563720703, 0.003879070281982422, 0.0040090084075927734, 0.004138946533203125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 1.0, 7.0, 11.0, 17.0, 14.0, 18.0, 18.0, 26.0, 38.0, 39.0, 75.0, 91.0, 136.0, 147.0, 90.0, 78.0, 49.0, 29.0, 28.0, 25.0, 22.0, 15.0, 8.0, 7.0, 3.0, 5.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000164031982421875, -0.000158749520778656, -0.000153467059135437, -0.00014818459749221802, -0.00014290213584899902, -0.00013761967420578003, -0.00013233721256256104, -0.00012705475091934204, -0.00012177228927612305, -0.00011648982763290405, -0.00011120736598968506, -0.00010592490434646606, -0.00010064244270324707, -9.535998106002808e-05, -9.007751941680908e-05, -8.479505777359009e-05, -7.95125961303711e-05, -7.42301344871521e-05, -6.89476728439331e-05, -6.366521120071411e-05, -5.838274955749512e-05, -5.310028791427612e-05, -4.781782627105713e-05, -4.2535364627838135e-05, -3.725290298461914e-05, -3.1970441341400146e-05, -2.6687979698181152e-05, -2.1405518054962158e-05, -1.6123056411743164e-05, -1.084059476852417e-05, -5.558133125305176e-06, -2.7567148208618164e-07, 5.0067901611328125e-06, 1.0289251804351807e-05, 1.55717134475708e-05, 2.0854175090789795e-05, 2.613663673400879e-05, 3.141909837722778e-05, 3.670156002044678e-05, 4.198402166366577e-05, 4.7266483306884766e-05, 5.254894495010376e-05, 5.7831406593322754e-05, 6.311386823654175e-05, 6.839632987976074e-05, 7.367879152297974e-05, 7.896125316619873e-05, 8.424371480941772e-05, 8.952617645263672e-05, 9.480863809585571e-05, 0.00010009109973907471, 0.0001053735613822937, 0.0001106560230255127, 0.00011593848466873169, 0.00012122094631195068, 0.00012650340795516968, 0.00013178586959838867, 0.00013706833124160767, 0.00014235079288482666, 0.00014763325452804565, 0.00015291571617126465, 0.00015819817781448364, 0.00016348063945770264, 0.00016876310110092163, 0.00017404556274414062]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 4.0, 11.0, 6.0, 14.0, 31.0, 34.0, 53.0, 74.0, 144.0, 245.0, 383.0, 726.0, 1525.0, 3683.0, 10636.0, 50507.0, 812277.0, 141562.0, 17145.0, 5265.0, 2038.0, 955.0, 492.0, 268.0, 190.0, 94.0, 53.0, 49.0, 28.0, 24.0, 17.0, 3.0, 5.0, 2.0, 7.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007236480712890625, -0.007021665573120117, -0.006806850433349609, -0.0065920352935791016, -0.006377220153808594, -0.006162405014038086, -0.005947589874267578, -0.00573277473449707, -0.0055179595947265625, -0.005303144454956055, -0.005088329315185547, -0.004873514175415039, -0.004658699035644531, -0.0044438838958740234, -0.004229068756103516, -0.004014253616333008, -0.0037994384765625, -0.003584623336791992, -0.0033698081970214844, -0.0031549930572509766, -0.0029401779174804688, -0.002725362777709961, -0.002510547637939453, -0.0022957324981689453, -0.0020809173583984375, -0.0018661022186279297, -0.0016512870788574219, -0.001436471939086914, -0.0012216567993164062, -0.0010068416595458984, -0.0007920265197753906, -0.0005772113800048828, -0.000362396240234375, -0.0001475811004638672, 6.723403930664062e-05, 0.00028204917907714844, 0.0004968643188476562, 0.0007116794586181641, 0.0009264945983886719, 0.0011413097381591797, 0.0013561248779296875, 0.0015709400177001953, 0.0017857551574707031, 0.002000570297241211, 0.0022153854370117188, 0.0024302005767822266, 0.0026450157165527344, 0.002859830856323242, 0.00307464599609375, 0.003289461135864258, 0.0035042762756347656, 0.0037190914154052734, 0.003933906555175781, 0.004148721694946289, 0.004363536834716797, 0.004578351974487305, 0.0047931671142578125, 0.00500798225402832, 0.005222797393798828, 0.005437612533569336, 0.005652427673339844, 0.0058672428131103516, 0.006082057952880859, 0.006296873092651367, 0.006511688232421875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 4.0, 3.0, 6.0, 5.0, 9.0, 16.0, 23.0, 17.0, 28.0, 47.0, 75.0, 170.0, 235.0, 149.0, 54.0, 47.0, 25.0, 21.0, 15.0, 9.0, 7.0, 2.0, 8.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00460052490234375, -0.004458427429199219, -0.0043163299560546875, -0.004174232482910156, -0.004032135009765625, -0.0038900375366210938, -0.0037479400634765625, -0.0036058425903320312, -0.0034637451171875, -0.0033216476440429688, -0.0031795501708984375, -0.0030374526977539062, -0.002895355224609375, -0.0027532577514648438, -0.0026111602783203125, -0.0024690628051757812, -0.00232696533203125, -0.0021848678588867188, -0.0020427703857421875, -0.0019006729125976562, -0.001758575439453125, -0.0016164779663085938, -0.0014743804931640625, -0.0013322830200195312, -0.001190185546875, -0.0010480880737304688, -0.0009059906005859375, -0.0007638931274414062, -0.000621795654296875, -0.00047969818115234375, -0.0003376007080078125, -0.00019550323486328125, -5.340576171875e-05, 8.869171142578125e-05, 0.0002307891845703125, 0.00037288665771484375, 0.000514984130859375, 0.0006570816040039062, 0.0007991790771484375, 0.0009412765502929688, 0.0010833740234375, 0.0012254714965820312, 0.0013675689697265625, 0.0015096664428710938, 0.001651763916015625, 0.0017938613891601562, 0.0019359588623046875, 0.0020780563354492188, 0.00222015380859375, 0.0023622512817382812, 0.0025043487548828125, 0.0026464462280273438, 0.002788543701171875, 0.0029306411743164062, 0.0030727386474609375, 0.0032148361206054688, 0.00335693359375, 0.0034990310668945312, 0.0036411285400390625, 0.0037832260131835938, 0.003925323486328125, 0.004067420959472656, 0.0042095184326171875, 0.004351615905761719, 0.00449371337890625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 12.0, 354.0, 587.0, 47.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.36001256108283997, -0.35347074270248413, -0.3469288945198059, -0.3403870761394501, -0.33384522795677185, -0.327303409576416, -0.3207615613937378, -0.31421974301338196, -0.30767789483070374, -0.3011360764503479, -0.2945942282676697, -0.28805240988731384, -0.2815105617046356, -0.2749687433242798, -0.26842689514160156, -0.2618850767612457, -0.2553432285785675, -0.24880139529705048, -0.24225956201553345, -0.23571772873401642, -0.2291758954524994, -0.22263406217098236, -0.21609222888946533, -0.2095503956079483, -0.20300857722759247, -0.19646674394607544, -0.1899249106645584, -0.18338307738304138, -0.17684124410152435, -0.17029941082000732, -0.1637575775384903, -0.15721574425697327, -0.15067392587661743, -0.1441320925951004, -0.13759025931358337, -0.13104842603206635, -0.12450659275054932, -0.11796475946903229, -0.11142292618751526, -0.10488109290599823, -0.0983392596244812, -0.09179742634296417, -0.08525559306144714, -0.07871375977993011, -0.07217192649841309, -0.06563009321689606, -0.05908826366066933, -0.0525464303791523, -0.04600459337234497, -0.03946276009082794, -0.03292092680931091, -0.026379095390439034, -0.019837262108922005, -0.013295430690050125, -0.006753597408533096, -0.0002117641270160675, 0.006330069154500961, 0.01287190243601799, 0.01941373571753502, 0.0259555671364069, 0.03249739855527878, 0.03903923183679581, 0.045581065118312836, 0.052122898399829865, 0.05866473168134689]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 8.0, 9.0, 14.0, 3.0, 10.0, 17.0, 16.0, 27.0, 15.0, 21.0, 24.0, 36.0, 42.0, 44.0, 37.0, 36.0, 42.0, 43.0, 49.0, 55.0, 46.0, 44.0, 52.0, 47.0, 34.0, 30.0, 33.0, 34.0, 20.0, 21.0, 19.0, 20.0, 13.0, 13.0, 9.0, 5.0, 3.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.022184371948242188, -0.02154526673257351, -0.02090616151690483, -0.020267056301236153, -0.019627951085567474, -0.018988845869898796, -0.018349740654230118, -0.01771063543856144, -0.01707153022289276, -0.016432425007224083, -0.015793319791555405, -0.015154214575886726, -0.014515109360218048, -0.01387600414454937, -0.013236898928880692, -0.012597793713212013, -0.011958688497543335, -0.011319583281874657, -0.010680478066205978, -0.0100413728505373, -0.009402267634868622, -0.008763162419199944, -0.008124057203531265, -0.007484951987862587, -0.006845846772193909, -0.00620674155652523, -0.005567636340856552, -0.004928531125187874, -0.0042894259095191956, -0.0036503206938505173, -0.003011215478181839, -0.0023721102625131607, -0.0017330050468444824, -0.0010938998311758041, -0.00045479461550712585, 0.00018431060016155243, 0.0008234158158302307, 0.001462521031498909, 0.0021016262471675873, 0.0027407314628362656, 0.003379836678504944, 0.004018941894173622, 0.0046580471098423, 0.005297152325510979, 0.005936257541179657, 0.006575362756848335, 0.0072144679725170135, 0.007853573188185692, 0.00849267840385437, 0.009131783619523048, 0.009770888835191727, 0.010409994050860405, 0.011049099266529083, 0.011688204482197762, 0.01232730969786644, 0.012966414913535118, 0.013605520129203796, 0.014244625344872475, 0.014883730560541153, 0.015522835776209831, 0.01616194099187851, 0.016801046207547188, 0.017440151423215866, 0.018079256638884544, 0.018718361854553223]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 9.0, 9.0, 14.0, 16.0, 18.0, 28.0, 55.0, 103.0, 163.0, 422.0, 2535.0, 28931.0, 4139991.0, 18411.0, 2076.0, 892.0, 447.0, 78.0, 30.0, 21.0, 14.0, 8.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0246429443359375, -0.023883581161499023, -0.023124217987060547, -0.02236485481262207, -0.021605491638183594, -0.020846128463745117, -0.02008676528930664, -0.019327402114868164, -0.018568038940429688, -0.01780867576599121, -0.017049312591552734, -0.016289949417114258, -0.015530586242675781, -0.014771223068237305, -0.014011859893798828, -0.013252496719360352, -0.012493133544921875, -0.011733770370483398, -0.010974407196044922, -0.010215044021606445, -0.009455680847167969, -0.008696317672729492, -0.007936954498291016, -0.007177591323852539, -0.0064182281494140625, -0.005658864974975586, -0.004899501800537109, -0.004140138626098633, -0.0033807754516601562, -0.0026214122772216797, -0.0018620491027832031, -0.0011026859283447266, -0.00034332275390625, 0.00041604042053222656, 0.0011754035949707031, 0.0019347667694091797, 0.0026941299438476562, 0.003453493118286133, 0.004212856292724609, 0.004972219467163086, 0.0057315826416015625, 0.006490945816040039, 0.007250308990478516, 0.008009672164916992, 0.008769035339355469, 0.009528398513793945, 0.010287761688232422, 0.011047124862670898, 0.011806488037109375, 0.012565851211547852, 0.013325214385986328, 0.014084577560424805, 0.014843940734863281, 0.015603303909301758, 0.016362667083740234, 0.01712203025817871, 0.017881393432617188, 0.018640756607055664, 0.01940011978149414, 0.020159482955932617, 0.020918846130371094, 0.02167820930480957, 0.022437572479248047, 0.023196935653686523, 0.023956298828125]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 22.0, 139.0, 360.0, 350.0, 117.0, 16.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0230255126953125, -0.022489190101623535, -0.02195286750793457, -0.021416544914245605, -0.02088022232055664, -0.020343899726867676, -0.01980757713317871, -0.019271254539489746, -0.01873493194580078, -0.018198609352111816, -0.01766228675842285, -0.017125964164733887, -0.016589641571044922, -0.016053318977355957, -0.015516996383666992, -0.014980673789978027, -0.014444351196289062, -0.013908028602600098, -0.013371706008911133, -0.012835383415222168, -0.012299060821533203, -0.011762738227844238, -0.011226415634155273, -0.010690093040466309, -0.010153770446777344, -0.009617447853088379, -0.009081125259399414, -0.00854480266571045, -0.008008480072021484, -0.0074721574783325195, -0.006935834884643555, -0.00639951229095459, -0.005863189697265625, -0.00532686710357666, -0.004790544509887695, -0.0042542219161987305, -0.0037178993225097656, -0.0031815767288208008, -0.002645254135131836, -0.002108931541442871, -0.0015726089477539062, -0.0010362863540649414, -0.0004999637603759766, 3.635883331298828e-05, 0.0005726814270019531, 0.001109004020690918, 0.0016453266143798828, 0.0021816492080688477, 0.0027179718017578125, 0.0032542943954467773, 0.003790616989135742, 0.004326939582824707, 0.004863262176513672, 0.005399584770202637, 0.0059359073638916016, 0.006472229957580566, 0.007008552551269531, 0.007544875144958496, 0.008081197738647461, 0.008617520332336426, 0.00915384292602539, 0.009690165519714355, 0.01022648811340332, 0.010762810707092285, 0.01129913330078125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 6.0, 10.0, 9.0, 12.0, 15.0, 29.0, 27.0, 35.0, 64.0, 132.0, 207.0, 412.0, 1008.0, 2796.0, 13013.0, 193093.0, 3902829.0, 69586.0, 7474.0, 1983.0, 723.0, 339.0, 175.0, 97.0, 76.0, 38.0, 29.0, 17.0, 13.0, 17.0, 8.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009033203125, -0.008702874183654785, -0.00837254524230957, -0.008042216300964355, -0.007711887359619141, -0.007381558418273926, -0.007051229476928711, -0.006720900535583496, -0.006390571594238281, -0.006060242652893066, -0.0057299137115478516, -0.005399584770202637, -0.005069255828857422, -0.004738926887512207, -0.004408597946166992, -0.004078269004821777, -0.0037479400634765625, -0.0034176111221313477, -0.003087282180786133, -0.002756953239440918, -0.002426624298095703, -0.0020962953567504883, -0.0017659664154052734, -0.0014356374740600586, -0.0011053085327148438, -0.0007749795913696289, -0.00044465065002441406, -0.00011432170867919922, 0.00021600723266601562, 0.0005463361740112305, 0.0008766651153564453, 0.0012069940567016602, 0.001537322998046875, 0.0018676519393920898, 0.0021979808807373047, 0.0025283098220825195, 0.0028586387634277344, 0.0031889677047729492, 0.003519296646118164, 0.003849625587463379, 0.004179954528808594, 0.004510283470153809, 0.0048406124114990234, 0.005170941352844238, 0.005501270294189453, 0.005831599235534668, 0.006161928176879883, 0.006492257118225098, 0.0068225860595703125, 0.007152915000915527, 0.007483243942260742, 0.007813572883605957, 0.008143901824951172, 0.008474230766296387, 0.008804559707641602, 0.009134888648986816, 0.009465217590332031, 0.009795546531677246, 0.010125875473022461, 0.010456204414367676, 0.01078653335571289, 0.011116862297058105, 0.01144719123840332, 0.011777520179748535, 0.01210784912109375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 16.0, 22.0, 51.0, 145.0, 606.0, 2562.0, 440.0, 115.0, 62.0, 17.0, 14.0, 8.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01403045654296875, -0.013691902160644531, -0.013353347778320312, -0.013014793395996094, -0.012676239013671875, -0.012337684631347656, -0.011999130249023438, -0.011660575866699219, -0.011322021484375, -0.010983467102050781, -0.010644912719726562, -0.010306358337402344, -0.009967803955078125, -0.009629249572753906, -0.009290695190429688, -0.008952140808105469, -0.00861358642578125, -0.008275032043457031, -0.007936477661132812, -0.007597923278808594, -0.007259368896484375, -0.006920814514160156, -0.0065822601318359375, -0.006243705749511719, -0.0059051513671875, -0.005566596984863281, -0.0052280426025390625, -0.004889488220214844, -0.004550933837890625, -0.004212379455566406, -0.0038738250732421875, -0.0035352706909179688, -0.00319671630859375, -0.0028581619262695312, -0.0025196075439453125, -0.0021810531616210938, -0.001842498779296875, -0.0015039443969726562, -0.0011653900146484375, -0.0008268356323242188, -0.00048828125, -0.00014972686767578125, 0.0001888275146484375, 0.0005273818969726562, 0.000865936279296875, 0.0012044906616210938, 0.0015430450439453125, 0.0018815994262695312, 0.00222015380859375, 0.0025587081909179688, 0.0028972625732421875, 0.0032358169555664062, 0.003574371337890625, 0.003912925720214844, 0.0042514801025390625, 0.004590034484863281, 0.0049285888671875, 0.005267143249511719, 0.0056056976318359375, 0.005944252014160156, 0.006282806396484375, 0.006621360778808594, 0.0069599151611328125, 0.007298469543457031, 0.00763702392578125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 22.0, 162.0, 530.0, 234.0, 40.0, 8.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035944804549217224, -0.03364570438861847, -0.031346604228019714, -0.02904750220477581, -0.026748402044177055, -0.0244493018835783, -0.022150199860334396, -0.01985109969973564, -0.017551999539136887, -0.015252899378538132, -0.012953798286616802, -0.010654697194695473, -0.008355597034096718, -0.006056496873497963, -0.0037573957815766335, -0.001458294689655304, 0.0008408054709434509, 0.003139906097203493, 0.005439006723463535, 0.0077381073497235775, 0.01003720797598362, 0.012336308136582375, 0.014635409228503704, 0.016934510320425034, 0.01923361048102379, 0.021532710641622543, 0.023831810802221298, 0.026130912825465202, 0.028430012986063957, 0.030729113146662712, 0.033028215169906616, 0.03532731533050537, 0.03762642294168472, 0.03992552310228348, 0.04222462326288223, 0.04452372342348099, 0.04682282358407974, 0.0491219237446785, 0.05142102763056755, 0.053720127791166306, 0.05601922795176506, 0.058318328112363815, 0.06061742827296257, 0.06291653215885162, 0.06521563231945038, 0.06751473248004913, 0.06981383264064789, 0.07211293280124664, 0.0744120329618454, 0.07671113312244415, 0.07901023328304291, 0.08130933344364166, 0.08360843360424042, 0.08590753376483917, 0.08820663392543793, 0.09050573408603668, 0.09280483424663544, 0.09510393440723419, 0.09740303456783295, 0.0997021347284317, 0.10200123488903046, 0.10430033504962921, 0.10659943521022797, 0.10889853537082672, 0.11119764298200607]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 6.0, 13.0, 27.0, 43.0, 42.0, 66.0, 75.0, 113.0, 95.0, 91.0, 89.0, 78.0, 88.0, 50.0, 52.0, 29.0, 19.0, 12.0, 5.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030101478099822998, -0.02927098609507084, -0.02844049409031868, -0.02761000208556652, -0.02677951008081436, -0.025949018076062202, -0.025118526071310043, -0.024288034066557884, -0.023457542061805725, -0.022627050057053566, -0.021796558052301407, -0.020966066047549248, -0.02013557404279709, -0.01930508203804493, -0.01847459003329277, -0.01764409802854061, -0.016813606023788452, -0.015983114019036293, -0.015152622014284134, -0.014322130009531975, -0.013491638004779816, -0.012661146000027657, -0.011830653995275497, -0.011000161990523338, -0.01016966998577118, -0.00933917798101902, -0.008508685976266861, -0.007678193971514702, -0.006847701966762543, -0.006017209962010384, -0.0051867179572582245, -0.004356225952506065, -0.0035257339477539062, -0.002695241943001747, -0.001864749938249588, -0.001034257933497429, -0.00020376592874526978, 0.0006267260760068893, 0.0014572180807590485, 0.0022877100855112076, 0.0031182020902633667, 0.003948694095015526, 0.004779186099767685, 0.005609678104519844, 0.006440170109272003, 0.007270662114024162, 0.008101154118776321, 0.00893164612352848, 0.00976213812828064, 0.010592630133032799, 0.011423122137784958, 0.012253614142537117, 0.013084106147289276, 0.013914598152041435, 0.014745090156793594, 0.015575582161545753, 0.016406074166297913, 0.01723656617105007, 0.01806705817580223, 0.01889755018055439, 0.01972804218530655, 0.020558534190058708, 0.021389026194810867, 0.022219518199563026, 0.023050010204315186]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 5.0, 5.0, 8.0, 10.0, 14.0, 34.0, 31.0, 56.0, 89.0, 121.0, 199.0, 360.0, 559.0, 1084.0, 3728.0, 168843.0, 857502.0, 12392.0, 1623.0, 765.0, 416.0, 256.0, 147.0, 97.0, 70.0, 36.0, 33.0, 21.0, 22.0, 9.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022308349609375, -0.021615982055664062, -0.020923614501953125, -0.020231246948242188, -0.01953887939453125, -0.018846511840820312, -0.018154144287109375, -0.017461776733398438, -0.0167694091796875, -0.016077041625976562, -0.015384674072265625, -0.014692306518554688, -0.01399993896484375, -0.013307571411132812, -0.012615203857421875, -0.011922836303710938, -0.01123046875, -0.010538101196289062, -0.009845733642578125, -0.009153366088867188, -0.00846099853515625, -0.0077686309814453125, -0.007076263427734375, -0.0063838958740234375, -0.0056915283203125, -0.0049991607666015625, -0.004306793212890625, -0.0036144256591796875, -0.00292205810546875, -0.0022296905517578125, -0.001537322998046875, -0.0008449554443359375, -0.000152587890625, 0.0005397796630859375, 0.001232147216796875, 0.0019245147705078125, 0.00261688232421875, 0.0033092498779296875, 0.004001617431640625, 0.0046939849853515625, 0.0053863525390625, 0.0060787200927734375, 0.006771087646484375, 0.0074634552001953125, 0.00815582275390625, 0.008848190307617188, 0.009540557861328125, 0.010232925415039062, 0.01092529296875, 0.011617660522460938, 0.012310028076171875, 0.013002395629882812, 0.01369476318359375, 0.014387130737304688, 0.015079498291015625, 0.015771865844726562, 0.0164642333984375, 0.017156600952148438, 0.017848968505859375, 0.018541336059570312, 0.01923370361328125, 0.019926071166992188, 0.020618438720703125, 0.021310806274414062, 0.022003173828125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 11.0, 86.0, 295.0, 404.0, 171.0, 39.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.02301025390625, -0.022478222846984863, -0.021946191787719727, -0.02141416072845459, -0.020882129669189453, -0.020350098609924316, -0.01981806755065918, -0.019286036491394043, -0.018754005432128906, -0.01822197437286377, -0.017689943313598633, -0.017157912254333496, -0.01662588119506836, -0.016093850135803223, -0.015561819076538086, -0.01502978801727295, -0.014497756958007812, -0.013965725898742676, -0.013433694839477539, -0.012901663780212402, -0.012369632720947266, -0.011837601661682129, -0.011305570602416992, -0.010773539543151855, -0.010241508483886719, -0.009709477424621582, -0.009177446365356445, -0.008645415306091309, -0.008113384246826172, -0.007581353187561035, -0.0070493221282958984, -0.006517291069030762, -0.005985260009765625, -0.005453228950500488, -0.0049211978912353516, -0.004389166831970215, -0.003857135772705078, -0.0033251047134399414, -0.0027930736541748047, -0.002261042594909668, -0.0017290115356445312, -0.0011969804763793945, -0.0006649494171142578, -0.0001329183578491211, 0.0003991127014160156, 0.0009311437606811523, 0.001463174819946289, 0.0019952058792114258, 0.0025272369384765625, 0.0030592679977416992, 0.003591299057006836, 0.004123330116271973, 0.004655361175537109, 0.005187392234802246, 0.005719423294067383, 0.0062514543533325195, 0.006783485412597656, 0.007315516471862793, 0.00784754753112793, 0.008379578590393066, 0.008911609649658203, 0.00944364070892334, 0.009975671768188477, 0.010507702827453613, 0.01103973388671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 8.0, 5.0, 7.0, 10.0, 10.0, 14.0, 20.0, 42.0, 82.0, 78.0, 122.0, 212.0, 443.0, 747.0, 1597.0, 3878.0, 10560.0, 31930.0, 103894.0, 306210.0, 371731.0, 147846.0, 45021.0, 14548.0, 5126.0, 2188.0, 951.0, 481.0, 312.0, 173.0, 96.0, 72.0, 31.0, 31.0, 33.0, 15.0, 13.0, 9.0, 9.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00505828857421875, -0.00490570068359375, -0.00475311279296875, -0.00460052490234375, -0.00444793701171875, -0.00429534912109375, -0.00414276123046875, -0.00399017333984375, -0.00383758544921875, -0.00368499755859375, -0.00353240966796875, -0.00337982177734375, -0.00322723388671875, -0.00307464599609375, -0.00292205810546875, -0.00276947021484375, -0.00261688232421875, -0.00246429443359375, -0.00231170654296875, -0.00215911865234375, -0.00200653076171875, -0.00185394287109375, -0.00170135498046875, -0.00154876708984375, -0.00139617919921875, -0.00124359130859375, -0.00109100341796875, -0.00093841552734375, -0.00078582763671875, -0.00063323974609375, -0.00048065185546875, -0.00032806396484375, -0.00017547607421875, -2.288818359375e-05, 0.00012969970703125, 0.00028228759765625, 0.00043487548828125, 0.00058746337890625, 0.00074005126953125, 0.00089263916015625, 0.00104522705078125, 0.00119781494140625, 0.00135040283203125, 0.00150299072265625, 0.00165557861328125, 0.00180816650390625, 0.00196075439453125, 0.00211334228515625, 0.00226593017578125, 0.00241851806640625, 0.00257110595703125, 0.00272369384765625, 0.00287628173828125, 0.00302886962890625, 0.00318145751953125, 0.00333404541015625, 0.00348663330078125, 0.00363922119140625, 0.00379180908203125, 0.00394439697265625, 0.00409698486328125, 0.00424957275390625, 0.00440216064453125, 0.00455474853515625, 0.00470733642578125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 7.0, 10.0, 12.0, 21.0, 17.0, 33.0, 40.0, 32.0, 40.0, 53.0, 42.0, 51.0, 57.0, 62.0, 67.0, 73.0, 53.0, 47.0, 38.0, 41.0, 42.0, 28.0, 22.0, 26.0, 24.0, 13.0, 17.0, 8.0, 4.0, 10.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00719451904296875, -0.0069620609283447266, -0.006729602813720703, -0.00649714469909668, -0.006264686584472656, -0.006032228469848633, -0.005799770355224609, -0.005567312240600586, -0.0053348541259765625, -0.005102396011352539, -0.004869937896728516, -0.004637479782104492, -0.004405021667480469, -0.004172563552856445, -0.003940105438232422, -0.0037076473236083984, -0.003475189208984375, -0.0032427310943603516, -0.003010272979736328, -0.0027778148651123047, -0.0025453567504882812, -0.002312898635864258, -0.0020804405212402344, -0.001847982406616211, -0.0016155242919921875, -0.001383066177368164, -0.0011506080627441406, -0.0009181499481201172, -0.0006856918334960938, -0.0004532337188720703, -0.00022077560424804688, 1.1682510375976562e-05, 0.000244140625, 0.00047659873962402344, 0.0007090568542480469, 0.0009415149688720703, 0.0011739730834960938, 0.0014064311981201172, 0.0016388893127441406, 0.001871347427368164, 0.0021038055419921875, 0.002336263656616211, 0.0025687217712402344, 0.002801179885864258, 0.0030336380004882812, 0.0032660961151123047, 0.003498554229736328, 0.0037310123443603516, 0.003963470458984375, 0.0041959285736083984, 0.004428386688232422, 0.004660844802856445, 0.004893302917480469, 0.005125761032104492, 0.005358219146728516, 0.005590677261352539, 0.0058231353759765625, 0.006055593490600586, 0.006288051605224609, 0.006520509719848633, 0.006752967834472656, 0.00698542594909668, 0.007217884063720703, 0.0074503421783447266, 0.00768280029296875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 13.0, 7.0, 13.0, 16.0, 11.0, 20.0, 32.0, 37.0, 55.0, 82.0, 129.0, 154.0, 301.0, 503.0, 813.0, 1389.0, 2626.0, 4636.0, 9044.0, 18493.0, 42386.0, 109623.0, 298146.0, 337613.0, 129967.0, 49314.0, 21155.0, 10078.0, 5134.0, 2821.0, 1521.0, 897.0, 562.0, 334.0, 205.0, 123.0, 87.0, 61.0, 49.0, 36.0, 18.0, 13.0, 9.0, 10.0, 5.0, 5.0, 5.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.00148773193359375, -0.0014398694038391113, -0.0013920068740844727, -0.001344144344329834, -0.0012962818145751953, -0.0012484192848205566, -0.001200556755065918, -0.0011526942253112793, -0.0011048316955566406, -0.001056969165802002, -0.0010091066360473633, -0.0009612441062927246, -0.0009133815765380859, -0.0008655190467834473, -0.0008176565170288086, -0.0007697939872741699, -0.0007219314575195312, -0.0006740689277648926, -0.0006262063980102539, -0.0005783438682556152, -0.0005304813385009766, -0.0004826188087463379, -0.0004347562789916992, -0.00038689374923706055, -0.0003390312194824219, -0.0002911686897277832, -0.00024330615997314453, -0.00019544363021850586, -0.0001475811004638672, -9.971857070922852e-05, -5.1856040954589844e-05, -3.993511199951172e-06, 4.38690185546875e-05, 9.173154830932617e-05, 0.00013959407806396484, 0.00018745660781860352, 0.0002353191375732422, 0.00028318166732788086, 0.00033104419708251953, 0.0003789067268371582, 0.0004267692565917969, 0.00047463178634643555, 0.0005224943161010742, 0.0005703568458557129, 0.0006182193756103516, 0.0006660819053649902, 0.0007139444351196289, 0.0007618069648742676, 0.0008096694946289062, 0.0008575320243835449, 0.0009053945541381836, 0.0009532570838928223, 0.001001119613647461, 0.0010489821434020996, 0.0010968446731567383, 0.001144707202911377, 0.0011925697326660156, 0.0012404322624206543, 0.001288294792175293, 0.0013361573219299316, 0.0013840198516845703, 0.001431882381439209, 0.0014797449111938477, 0.0015276074409484863, 0.001575469970703125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 5.0, 4.0, 3.0, 17.0, 9.0, 17.0, 10.0, 14.0, 18.0, 33.0, 44.0, 49.0, 75.0, 81.0, 95.0, 89.0, 88.0, 74.0, 54.0, 42.0, 24.0, 29.0, 19.0, 20.0, 16.0, 12.0, 9.0, 6.0, 5.0, 2.0, 6.0, 5.0, 3.0, 8.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010460615158081055, -0.000101444311439991, -9.828247129917145e-05, -9.51206311583519e-05, -9.195879101753235e-05, -8.87969508767128e-05, -8.563511073589325e-05, -8.24732705950737e-05, -7.931143045425415e-05, -7.61495903134346e-05, -7.298775017261505e-05, -6.98259100317955e-05, -6.666406989097595e-05, -6.35022297501564e-05, -6.034038960933685e-05, -5.7178549468517303e-05, -5.4016709327697754e-05, -5.0854869186878204e-05, -4.7693029046058655e-05, -4.4531188905239105e-05, -4.1369348764419556e-05, -3.8207508623600006e-05, -3.5045668482780457e-05, -3.188382834196091e-05, -2.8721988201141357e-05, -2.5560148060321808e-05, -2.2398307919502258e-05, -1.923646777868271e-05, -1.607462763786316e-05, -1.291278749704361e-05, -9.75094735622406e-06, -6.5891072154045105e-06, -3.427267074584961e-06, -2.654269337654114e-07, 2.896413207054138e-06, 6.058253347873688e-06, 9.220093488693237e-06, 1.2381933629512787e-05, 1.5543773770332336e-05, 1.8705613911151886e-05, 2.1867454051971436e-05, 2.5029294192790985e-05, 2.8191134333610535e-05, 3.1352974474430084e-05, 3.4514814615249634e-05, 3.767665475606918e-05, 4.083849489688873e-05, 4.400033503770828e-05, 4.716217517852783e-05, 5.032401531934738e-05, 5.348585546016693e-05, 5.664769560098648e-05, 5.980953574180603e-05, 6.297137588262558e-05, 6.613321602344513e-05, 6.929505616426468e-05, 7.245689630508423e-05, 7.561873644590378e-05, 7.878057658672333e-05, 8.194241672754288e-05, 8.510425686836243e-05, 8.826609700918198e-05, 9.142793715000153e-05, 9.458977729082108e-05, 9.775161743164062e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 4.0, 11.0, 16.0, 22.0, 18.0, 39.0, 58.0, 84.0, 190.0, 266.0, 504.0, 943.0, 1749.0, 3662.0, 7513.0, 16549.0, 41701.0, 126837.0, 416506.0, 293595.0, 84566.0, 29559.0, 12541.0, 5644.0, 2812.0, 1402.0, 746.0, 407.0, 232.0, 134.0, 83.0, 54.0, 35.0, 22.0, 20.0, 12.0, 8.0, 4.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019407272338867188, -0.0018777698278427124, -0.001814812421798706, -0.0017518550157546997, -0.0016888976097106934, -0.001625940203666687, -0.0015629827976226807, -0.0015000253915786743, -0.001437067985534668, -0.0013741105794906616, -0.0013111531734466553, -0.001248195767402649, -0.0011852383613586426, -0.0011222809553146362, -0.0010593235492706299, -0.0009963661432266235, -0.0009334087371826172, -0.0008704513311386108, -0.0008074939250946045, -0.0007445365190505981, -0.0006815791130065918, -0.0006186217069625854, -0.0005556643009185791, -0.0004927068948745728, -0.0004297494888305664, -0.00036679208278656006, -0.0003038346767425537, -0.00024087727069854736, -0.00017791986465454102, -0.00011496245861053467, -5.200505256652832e-05, 1.0952353477478027e-05, 7.390975952148438e-05, 0.00013686716556549072, 0.00019982457160949707, 0.0002627819776535034, 0.00032573938369750977, 0.0003886967897415161, 0.00045165419578552246, 0.0005146116018295288, 0.0005775690078735352, 0.0006405264139175415, 0.0007034838199615479, 0.0007664412260055542, 0.0008293986320495605, 0.0008923560380935669, 0.0009553134441375732, 0.0010182708501815796, 0.001081228256225586, 0.0011441856622695923, 0.0012071430683135986, 0.001270100474357605, 0.0013330578804016113, 0.0013960152864456177, 0.001458972692489624, 0.0015219300985336304, 0.0015848875045776367, 0.001647844910621643, 0.0017108023166656494, 0.0017737597227096558, 0.0018367171287536621, 0.0018996745347976685, 0.001962631940841675, 0.002025589346885681, 0.0020885467529296875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 4.0, 0.0, 5.0, 2.0, 7.0, 6.0, 10.0, 8.0, 11.0, 21.0, 16.0, 21.0, 37.0, 39.0, 73.0, 82.0, 92.0, 105.0, 106.0, 95.0, 61.0, 40.0, 40.0, 32.0, 12.0, 16.0, 11.0, 8.0, 10.0, 8.0, 5.0, 5.0, 3.0, 0.0, 2.0, 5.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0018978118896484375, -0.001833587884902954, -0.0017693638801574707, -0.0017051398754119873, -0.001640915870666504, -0.0015766918659210205, -0.0015124678611755371, -0.0014482438564300537, -0.0013840198516845703, -0.001319795846939087, -0.0012555718421936035, -0.0011913478374481201, -0.0011271238327026367, -0.0010628998279571533, -0.00099867582321167, -0.0009344518184661865, -0.0008702278137207031, -0.0008060038089752197, -0.0007417798042297363, -0.0006775557994842529, -0.0006133317947387695, -0.0005491077899932861, -0.00048488378524780273, -0.00042065978050231934, -0.00035643577575683594, -0.00029221177101135254, -0.00022798776626586914, -0.00016376376152038574, -9.953975677490234e-05, -3.5315752029418945e-05, 2.8908252716064453e-05, 9.313225746154785e-05, 0.00015735626220703125, 0.00022158026695251465, 0.00028580427169799805, 0.00035002827644348145, 0.00041425228118896484, 0.00047847628593444824, 0.0005427002906799316, 0.000606924295425415, 0.0006711483001708984, 0.0007353723049163818, 0.0007995963096618652, 0.0008638203144073486, 0.000928044319152832, 0.0009922683238983154, 0.0010564923286437988, 0.0011207163333892822, 0.0011849403381347656, 0.001249164342880249, 0.0013133883476257324, 0.0013776123523712158, 0.0014418363571166992, 0.0015060603618621826, 0.001570284366607666, 0.0016345083713531494, 0.0016987323760986328, 0.0017629563808441162, 0.0018271803855895996, 0.001891404390335083, 0.0019556283950805664, 0.00201985239982605, 0.002084076404571533, 0.0021483004093170166, 0.0022125244140625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 16.0, 11.0, 23.0, 23.0, 40.0, 68.0, 98.0, 131.0, 117.0, 131.0, 111.0, 83.0, 39.0, 37.0, 19.0, 12.0, 14.0, 11.0, 2.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.027160223573446274, -0.02648690529167652, -0.025813588872551918, -0.025140270590782166, -0.024466952309012413, -0.02379363402724266, -0.023120317608118057, -0.022446999326348305, -0.021773681044578552, -0.0211003627628088, -0.020427046343684196, -0.019753728061914444, -0.01908040978014469, -0.01840709149837494, -0.017733775079250336, -0.017060456797480583, -0.01638714037835598, -0.015713822096586227, -0.01504050474613905, -0.014367187395691872, -0.01369386911392212, -0.013020551763474941, -0.012347234413027763, -0.01167391613125801, -0.011000598780810833, -0.010327281430363655, -0.009653963148593903, -0.008980645798146725, -0.008307328447699547, -0.007634010165929794, -0.006960692815482616, -0.006287374999374151, -0.005614057183265686, -0.004940739367157221, -0.004267421551048756, -0.0035941042006015778, -0.0029207863844931126, -0.0022474685683846474, -0.0015741512179374695, -0.0009008334018290043, -0.0002275155857205391, 0.0004458021139726043, 0.0011191198136657476, 0.0017924373969435692, 0.0024657552130520344, 0.0031390730291604996, 0.0038123903796076775, 0.004485708195716143, 0.005159026011824608, 0.005832343827933073, 0.006505661644041538, 0.007178978994488716, 0.007852297276258469, 0.008525614626705647, 0.009198931977152824, 0.009872250258922577, 0.010545567609369755, 0.011218884959816933, 0.011892203241586685, 0.012565520592033863, 0.013238837942481041, 0.013912156224250793, 0.014585473574697971, 0.01525879092514515, 0.0159321092069149]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 2.0, 7.0, 11.0, 13.0, 12.0, 11.0, 14.0, 20.0, 13.0, 21.0, 24.0, 33.0, 29.0, 35.0, 33.0, 45.0, 35.0, 32.0, 51.0, 53.0, 34.0, 47.0, 40.0, 39.0, 33.0, 42.0, 33.0, 34.0, 29.0, 19.0, 27.0, 19.0, 25.0, 16.0, 13.0, 10.0, 16.0, 9.0, 6.0, 9.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01225346326828003, -0.011786194518208504, -0.011318925768136978, -0.010851657018065453, -0.010384388267993927, -0.009917119517922401, -0.009449850767850876, -0.00898258201777935, -0.008515313267707825, -0.0080480445176363, -0.0075807757675647736, -0.007113507017493248, -0.006646238267421722, -0.006178969517350197, -0.005711700767278671, -0.005244432017207146, -0.00477716326713562, -0.0043098945170640945, -0.003842625766992569, -0.0033753570169210434, -0.002908088266849518, -0.0024408195167779922, -0.0019735507667064667, -0.001506282016634941, -0.0010390132665634155, -0.00057174451649189, -0.00010447576642036438, 0.0003627929836511612, 0.0008300617337226868, 0.0012973304837942123, 0.001764599233865738, 0.0022318679839372635, 0.002699136734008789, 0.0031664054840803146, 0.00363367423415184, 0.004100942984223366, 0.004568211734294891, 0.005035480484366417, 0.0055027492344379425, 0.005970017984509468, 0.006437286734580994, 0.006904555484652519, 0.007371824234724045, 0.00783909298479557, 0.008306361734867096, 0.008773630484938622, 0.009240899235010147, 0.009708167985081673, 0.010175436735153198, 0.010642705485224724, 0.01110997423529625, 0.011577242985367775, 0.0120445117354393, 0.012511780485510826, 0.012979049235582352, 0.013446317985653877, 0.013913586735725403, 0.014380855485796928, 0.014848124235868454, 0.01531539298593998, 0.015782661736011505, 0.01624993048608303, 0.016717199236154556, 0.017184467986226082, 0.017651736736297607]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 13.0, 21.0, 42.0, 68.0, 129.0, 276.0, 625.0, 2399.0, 51148.0, 4128148.0, 8413.0, 1915.0, 757.0, 175.0, 74.0, 31.0, 14.0, 11.0, 6.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.027923583984375, -0.026900291442871094, -0.025876998901367188, -0.02485370635986328, -0.023830413818359375, -0.02280712127685547, -0.021783828735351562, -0.020760536193847656, -0.01973724365234375, -0.018713951110839844, -0.017690658569335938, -0.01666736602783203, -0.015644073486328125, -0.014620780944824219, -0.013597488403320312, -0.012574195861816406, -0.0115509033203125, -0.010527610778808594, -0.009504318237304688, -0.008481025695800781, -0.007457733154296875, -0.006434440612792969, -0.0054111480712890625, -0.004387855529785156, -0.00336456298828125, -0.0023412704467773438, -0.0013179779052734375, -0.00029468536376953125, 0.000728607177734375, 0.0017518997192382812, 0.0027751922607421875, 0.0037984848022460938, 0.00482177734375, 0.005845069885253906, 0.0068683624267578125, 0.007891654968261719, 0.008914947509765625, 0.009938240051269531, 0.010961532592773438, 0.011984825134277344, 0.01300811767578125, 0.014031410217285156, 0.015054702758789062, 0.01607799530029297, 0.017101287841796875, 0.01812458038330078, 0.019147872924804688, 0.020171165466308594, 0.0211944580078125, 0.022217750549316406, 0.023241043090820312, 0.02426433563232422, 0.025287628173828125, 0.02631092071533203, 0.027334213256835938, 0.028357505798339844, 0.02938079833984375, 0.030404090881347656, 0.03142738342285156, 0.03245067596435547, 0.033473968505859375, 0.03449726104736328, 0.03552055358886719, 0.036543846130371094, 0.037567138671875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 28.0, 138.0, 380.0, 326.0, 117.0, 15.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0221099853515625, -0.021582484245300293, -0.021054983139038086, -0.02052748203277588, -0.019999980926513672, -0.019472479820251465, -0.018944978713989258, -0.01841747760772705, -0.017889976501464844, -0.017362475395202637, -0.01683497428894043, -0.016307473182678223, -0.015779972076416016, -0.015252470970153809, -0.014724969863891602, -0.014197468757629395, -0.013669967651367188, -0.01314246654510498, -0.012614965438842773, -0.012087464332580566, -0.01155996322631836, -0.011032462120056152, -0.010504961013793945, -0.009977459907531738, -0.009449958801269531, -0.008922457695007324, -0.008394956588745117, -0.00786745548248291, -0.007339954376220703, -0.006812453269958496, -0.006284952163696289, -0.005757451057434082, -0.005229949951171875, -0.004702448844909668, -0.004174947738647461, -0.003647446632385254, -0.003119945526123047, -0.00259244441986084, -0.002064943313598633, -0.0015374422073364258, -0.0010099411010742188, -0.0004824399948120117, 4.506111145019531e-05, 0.0005725622177124023, 0.0011000633239746094, 0.0016275644302368164, 0.0021550655364990234, 0.0026825666427612305, 0.0032100677490234375, 0.0037375688552856445, 0.0042650699615478516, 0.004792571067810059, 0.005320072174072266, 0.005847573280334473, 0.00637507438659668, 0.006902575492858887, 0.007430076599121094, 0.0079575777053833, 0.008485078811645508, 0.009012579917907715, 0.009540081024169922, 0.010067582130432129, 0.010595083236694336, 0.011122584342956543, 0.01165008544921875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 7.0, 9.0, 17.0, 18.0, 41.0, 48.0, 78.0, 130.0, 278.0, 549.0, 1452.0, 4164.0, 19883.0, 373285.0, 3730642.0, 52411.0, 7416.0, 2239.0, 811.0, 383.0, 160.0, 89.0, 58.0, 48.0, 21.0, 16.0, 11.0, 6.0, 7.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0130615234375, -0.01271975040435791, -0.01237797737121582, -0.01203620433807373, -0.01169443130493164, -0.01135265827178955, -0.011010885238647461, -0.010669112205505371, -0.010327339172363281, -0.009985566139221191, -0.009643793106079102, -0.009302020072937012, -0.008960247039794922, -0.008618474006652832, -0.008276700973510742, -0.007934927940368652, -0.0075931549072265625, -0.007251381874084473, -0.006909608840942383, -0.006567835807800293, -0.006226062774658203, -0.005884289741516113, -0.0055425167083740234, -0.005200743675231934, -0.004858970642089844, -0.004517197608947754, -0.004175424575805664, -0.0038336515426635742, -0.0034918785095214844, -0.0031501054763793945, -0.0028083324432373047, -0.002466559410095215, -0.002124786376953125, -0.0017830133438110352, -0.0014412403106689453, -0.0010994672775268555, -0.0007576942443847656, -0.0004159212112426758, -7.414817810058594e-05, 0.0002676248550415039, 0.0006093978881835938, 0.0009511709213256836, 0.0012929439544677734, 0.0016347169876098633, 0.001976490020751953, 0.002318263053894043, 0.002660036087036133, 0.0030018091201782227, 0.0033435821533203125, 0.0036853551864624023, 0.004027128219604492, 0.004368901252746582, 0.004710674285888672, 0.005052447319030762, 0.0053942203521728516, 0.005735993385314941, 0.006077766418457031, 0.006419539451599121, 0.006761312484741211, 0.007103085517883301, 0.007444858551025391, 0.0077866315841674805, 0.00812840461730957, 0.00847017765045166, 0.00881195068359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 5.0, 22.0, 29.0, 48.0, 102.0, 321.0, 1838.0, 1296.0, 205.0, 103.0, 43.0, 17.0, 16.0, 9.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00830841064453125, -0.007960796356201172, -0.007613182067871094, -0.007265567779541016, -0.0069179534912109375, -0.006570339202880859, -0.006222724914550781, -0.005875110626220703, -0.005527496337890625, -0.005179882049560547, -0.004832267761230469, -0.004484653472900391, -0.0041370391845703125, -0.0037894248962402344, -0.0034418106079101562, -0.003094196319580078, -0.00274658203125, -0.002398967742919922, -0.0020513534545898438, -0.0017037391662597656, -0.0013561248779296875, -0.0010085105895996094, -0.0006608963012695312, -0.0003132820129394531, 3.4332275390625e-05, 0.0003819465637207031, 0.0007295608520507812, 0.0010771751403808594, 0.0014247894287109375, 0.0017724037170410156, 0.0021200180053710938, 0.002467632293701172, 0.00281524658203125, 0.003162860870361328, 0.0035104751586914062, 0.0038580894470214844, 0.0042057037353515625, 0.004553318023681641, 0.004900932312011719, 0.005248546600341797, 0.005596160888671875, 0.005943775177001953, 0.006291389465332031, 0.006639003753662109, 0.0069866180419921875, 0.007334232330322266, 0.007681846618652344, 0.008029460906982422, 0.0083770751953125, 0.008724689483642578, 0.009072303771972656, 0.009419918060302734, 0.009767532348632812, 0.01011514663696289, 0.010462760925292969, 0.010810375213623047, 0.011157989501953125, 0.011505603790283203, 0.011853218078613281, 0.01220083236694336, 0.012548446655273438, 0.012896060943603516, 0.013243675231933594, 0.013591289520263672, 0.01393890380859375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 14.0, 47.0, 249.0, 467.0, 189.0, 26.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06916815787553787, -0.06634154915809631, -0.06351494044065475, -0.060688331723213196, -0.05786171928048134, -0.05503511056303978, -0.05220850184559822, -0.049381889402866364, -0.046555280685424805, -0.043728671967983246, -0.04090206325054169, -0.03807545453310013, -0.03524884209036827, -0.03242223337292671, -0.029595624655485153, -0.026769014075398445, -0.023942407220602036, -0.021115798503160477, -0.01828918792307377, -0.01546257920563221, -0.012635969556868076, -0.009809359908103943, -0.006982751190662384, -0.004156140610575676, -0.0013295318931341171, 0.0014970775227993727, 0.0043236869387328625, 0.007150296121835709, 0.009976905770599842, 0.012803515419363976, 0.015630124136805534, 0.018456734716892242, 0.0212833434343338, 0.02410995215177536, 0.026936562731862068, 0.029763171449303627, 0.032589782029390335, 0.035416390746831894, 0.03824299946427345, 0.04106961190700531, 0.04389622062444687, 0.04672282934188843, 0.04954943805932999, 0.052376046776771545, 0.0552026592195034, 0.05802926793694496, 0.06085587665438652, 0.06368248909711838, 0.06650909781455994, 0.0693357065320015, 0.07216231524944305, 0.07498892396688461, 0.07781553268432617, 0.08064214885234833, 0.08346875011920929, 0.08629536628723145, 0.08912196755409241, 0.09194857627153397, 0.09477518498897552, 0.09760179370641708, 0.10042840242385864, 0.1032550185918808, 0.10608161985874176, 0.10890823602676392, 0.11173484474420547]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 10.0, 9.0, 9.0, 15.0, 14.0, 24.0, 32.0, 38.0, 37.0, 41.0, 59.0, 64.0, 57.0, 61.0, 59.0, 55.0, 68.0, 56.0, 45.0, 48.0, 56.0, 37.0, 24.0, 21.0, 11.0, 9.0, 17.0, 6.0, 5.0, 5.0, 6.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02516472339630127, -0.024431748315691948, -0.023698773235082626, -0.022965798154473305, -0.022232823073863983, -0.02149984799325466, -0.02076687291264534, -0.02003389783203602, -0.019300922751426697, -0.018567947670817375, -0.017834972590208054, -0.017101997509598732, -0.01636902242898941, -0.01563604734838009, -0.014903072267770767, -0.014170097187161446, -0.013437122106552124, -0.012704147025942802, -0.01197117194533348, -0.01123819686472416, -0.010505221784114838, -0.009772246703505516, -0.009039271622896194, -0.008306296542286873, -0.007573321461677551, -0.00684034638106823, -0.006107371300458908, -0.0053743962198495865, -0.004641421139240265, -0.003908446058630943, -0.0031754709780216217, -0.0024424958974123, -0.0017095208168029785, -0.0009765457361936569, -0.00024357065558433533, 0.0004894044250249863, 0.0012223795056343079, 0.0019553545862436295, 0.002688329666852951, 0.0034213047474622726, 0.004154279828071594, 0.004887254908680916, 0.005620229989290237, 0.006353205069899559, 0.007086180150508881, 0.007819155231118202, 0.008552130311727524, 0.009285105392336845, 0.010018080472946167, 0.010751055553555489, 0.01148403063416481, 0.012217005714774132, 0.012949980795383453, 0.013682955875992775, 0.014415930956602097, 0.015148906037211418, 0.01588188111782074, 0.01661485619843006, 0.017347831279039383, 0.018080806359648705, 0.018813781440258026, 0.019546756520867348, 0.02027973160147667, 0.02101270668208599, 0.021745681762695312]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 3.0, 5.0, 16.0, 8.0, 15.0, 28.0, 32.0, 29.0, 38.0, 44.0, 78.0, 91.0, 133.0, 188.0, 282.0, 436.0, 693.0, 1339.0, 4855.0, 52353.0, 790961.0, 181869.0, 10492.0, 2005.0, 881.0, 532.0, 306.0, 240.0, 147.0, 109.0, 98.0, 65.0, 38.0, 44.0, 28.0, 21.0, 13.0, 9.0, 6.0, 4.0, 3.0, 3.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.01885986328125, -0.0182647705078125, -0.017669677734375, -0.0170745849609375, -0.0164794921875, -0.0158843994140625, -0.015289306640625, -0.0146942138671875, -0.01409912109375, -0.0135040283203125, -0.012908935546875, -0.0123138427734375, -0.01171875, -0.0111236572265625, -0.010528564453125, -0.0099334716796875, -0.00933837890625, -0.0087432861328125, -0.008148193359375, -0.0075531005859375, -0.0069580078125, -0.0063629150390625, -0.005767822265625, -0.0051727294921875, -0.00457763671875, -0.0039825439453125, -0.003387451171875, -0.0027923583984375, -0.002197265625, -0.0016021728515625, -0.001007080078125, -0.0004119873046875, 0.00018310546875, 0.0007781982421875, 0.001373291015625, 0.0019683837890625, 0.0025634765625, 0.0031585693359375, 0.003753662109375, 0.0043487548828125, 0.00494384765625, 0.0055389404296875, 0.006134033203125, 0.0067291259765625, 0.00732421875, 0.0079193115234375, 0.008514404296875, 0.0091094970703125, 0.00970458984375, 0.0102996826171875, 0.010894775390625, 0.0114898681640625, 0.0120849609375, 0.0126800537109375, 0.013275146484375, 0.0138702392578125, 0.01446533203125, 0.0150604248046875, 0.015655517578125, 0.0162506103515625, 0.016845703125, 0.0174407958984375, 0.018035888671875, 0.0186309814453125, 0.01922607421875]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 24.0, 149.0, 375.0, 325.0, 113.0, 17.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0219573974609375, -0.021433234214782715, -0.02090907096862793, -0.020384907722473145, -0.01986074447631836, -0.019336581230163574, -0.01881241798400879, -0.018288254737854004, -0.01776409149169922, -0.017239928245544434, -0.01671576499938965, -0.016191601753234863, -0.015667438507080078, -0.015143275260925293, -0.014619112014770508, -0.014094948768615723, -0.013570785522460938, -0.013046622276306152, -0.012522459030151367, -0.011998295783996582, -0.011474132537841797, -0.010949969291687012, -0.010425806045532227, -0.009901642799377441, -0.009377479553222656, -0.008853316307067871, -0.008329153060913086, -0.007804989814758301, -0.007280826568603516, -0.0067566633224487305, -0.006232500076293945, -0.00570833683013916, -0.005184173583984375, -0.00466001033782959, -0.004135847091674805, -0.0036116838455200195, -0.0030875205993652344, -0.0025633573532104492, -0.002039194107055664, -0.001515030860900879, -0.0009908676147460938, -0.0004667043685913086, 5.745887756347656e-05, 0.0005816221237182617, 0.0011057853698730469, 0.001629948616027832, 0.002154111862182617, 0.0026782751083374023, 0.0032024383544921875, 0.0037266016006469727, 0.004250764846801758, 0.004774928092956543, 0.005299091339111328, 0.005823254585266113, 0.0063474178314208984, 0.006871581077575684, 0.007395744323730469, 0.007919907569885254, 0.008444070816040039, 0.008968234062194824, 0.00949239730834961, 0.010016560554504395, 0.01054072380065918, 0.011064887046813965, 0.01158905029296875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 9.0, 11.0, 15.0, 28.0, 42.0, 53.0, 74.0, 128.0, 176.0, 315.0, 485.0, 1004.0, 2057.0, 5648.0, 16937.0, 55962.0, 223855.0, 484479.0, 186453.0, 47520.0, 14336.0, 4912.0, 1936.0, 910.0, 472.0, 275.0, 146.0, 96.0, 64.0, 52.0, 33.0, 21.0, 11.0, 11.0, 9.0, 8.0, 4.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006748199462890625, -0.006492912769317627, -0.006237626075744629, -0.005982339382171631, -0.005727052688598633, -0.005471765995025635, -0.005216479301452637, -0.004961192607879639, -0.004705905914306641, -0.004450619220733643, -0.0041953325271606445, -0.0039400458335876465, -0.0036847591400146484, -0.0034294724464416504, -0.0031741857528686523, -0.0029188990592956543, -0.0026636123657226562, -0.002408325672149658, -0.00215303897857666, -0.0018977522850036621, -0.001642465591430664, -0.001387178897857666, -0.001131892204284668, -0.0008766055107116699, -0.0006213188171386719, -0.00036603212356567383, -0.00011074542999267578, 0.00014454126358032227, 0.0003998279571533203, 0.0006551146507263184, 0.0009104013442993164, 0.0011656880378723145, 0.0014209747314453125, 0.0016762614250183105, 0.0019315481185913086, 0.0021868348121643066, 0.0024421215057373047, 0.0026974081993103027, 0.0029526948928833008, 0.003207981586456299, 0.003463268280029297, 0.003718554973602295, 0.003973841667175293, 0.004229128360748291, 0.004484415054321289, 0.004739701747894287, 0.004994988441467285, 0.005250275135040283, 0.005505561828613281, 0.005760848522186279, 0.006016135215759277, 0.006271421909332275, 0.0065267086029052734, 0.0067819952964782715, 0.0070372819900512695, 0.007292568683624268, 0.007547855377197266, 0.007803142070770264, 0.008058428764343262, 0.00831371545791626, 0.008569002151489258, 0.008824288845062256, 0.009079575538635254, 0.009334862232208252, 0.00959014892578125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 10.0, 16.0, 14.0, 11.0, 25.0, 43.0, 41.0, 45.0, 41.0, 67.0, 49.0, 75.0, 62.0, 62.0, 66.0, 64.0, 54.0, 36.0, 46.0, 37.0, 37.0, 23.0, 17.0, 18.0, 14.0, 7.0, 5.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00847625732421875, -0.008148789405822754, -0.007821321487426758, -0.007493853569030762, -0.007166385650634766, -0.0068389177322387695, -0.0065114498138427734, -0.006183981895446777, -0.005856513977050781, -0.005529046058654785, -0.005201578140258789, -0.004874110221862793, -0.004546642303466797, -0.004219174385070801, -0.0038917064666748047, -0.0035642385482788086, -0.0032367706298828125, -0.0029093027114868164, -0.0025818347930908203, -0.0022543668746948242, -0.0019268989562988281, -0.001599431037902832, -0.001271963119506836, -0.0009444952011108398, -0.0006170272827148438, -0.00028955936431884766, 3.790855407714844e-05, 0.00036537647247314453, 0.0006928443908691406, 0.0010203123092651367, 0.0013477802276611328, 0.001675248146057129, 0.002002716064453125, 0.002330183982849121, 0.002657651901245117, 0.0029851198196411133, 0.0033125877380371094, 0.0036400556564331055, 0.0039675235748291016, 0.004294991493225098, 0.004622459411621094, 0.00494992733001709, 0.005277395248413086, 0.005604863166809082, 0.005932331085205078, 0.006259799003601074, 0.00658726692199707, 0.006914734840393066, 0.0072422027587890625, 0.007569670677185059, 0.007897138595581055, 0.00822460651397705, 0.008552074432373047, 0.008879542350769043, 0.009207010269165039, 0.009534478187561035, 0.009861946105957031, 0.010189414024353027, 0.010516881942749023, 0.01084434986114502, 0.011171817779541016, 0.011499285697937012, 0.011826753616333008, 0.012154221534729004, 0.012481689453125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 6.0, 3.0, 7.0, 5.0, 11.0, 12.0, 18.0, 19.0, 52.0, 72.0, 118.0, 242.0, 399.0, 809.0, 1662.0, 3764.0, 9811.0, 28809.0, 101075.0, 398456.0, 368731.0, 91495.0, 27034.0, 9151.0, 3485.0, 1573.0, 773.0, 360.0, 237.0, 122.0, 82.0, 59.0, 43.0, 13.0, 17.0, 7.0, 5.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0034351348876953125, -0.003327667713165283, -0.003220200538635254, -0.0031127333641052246, -0.0030052661895751953, -0.002897799015045166, -0.0027903318405151367, -0.0026828646659851074, -0.002575397491455078, -0.002467930316925049, -0.0023604631423950195, -0.0022529959678649902, -0.002145528793334961, -0.0020380616188049316, -0.0019305944442749023, -0.001823127269744873, -0.0017156600952148438, -0.0016081929206848145, -0.0015007257461547852, -0.0013932585716247559, -0.0012857913970947266, -0.0011783242225646973, -0.001070857048034668, -0.0009633898735046387, -0.0008559226989746094, -0.0007484555244445801, -0.0006409883499145508, -0.0005335211753845215, -0.0004260540008544922, -0.0003185868263244629, -0.0002111196517944336, -0.0001036524772644043, 3.814697265625e-06, 0.0001112818717956543, 0.0002187490463256836, 0.0003262162208557129, 0.0004336833953857422, 0.0005411505699157715, 0.0006486177444458008, 0.0007560849189758301, 0.0008635520935058594, 0.0009710192680358887, 0.001078486442565918, 0.0011859536170959473, 0.0012934207916259766, 0.0014008879661560059, 0.0015083551406860352, 0.0016158223152160645, 0.0017232894897460938, 0.001830756664276123, 0.0019382238388061523, 0.0020456910133361816, 0.002153158187866211, 0.0022606253623962402, 0.0023680925369262695, 0.002475559711456299, 0.002583026885986328, 0.0026904940605163574, 0.0027979612350463867, 0.002905428409576416, 0.0030128955841064453, 0.0031203627586364746, 0.003227829933166504, 0.003335297107696533, 0.0034427642822265625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 5.0, 8.0, 7.0, 11.0, 11.0, 13.0, 20.0, 27.0, 22.0, 30.0, 41.0, 57.0, 45.0, 63.0, 68.0, 70.0, 66.0, 66.0, 63.0, 55.0, 45.0, 34.0, 29.0, 25.0, 20.0, 6.0, 12.0, 7.0, 8.0, 8.0, 7.0, 11.0, 7.0, 5.0, 4.0, 7.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.92605972290039e-05, -6.694812327623367e-05, -6.463564932346344e-05, -6.232317537069321e-05, -6.0010701417922974e-05, -5.769822746515274e-05, -5.538575351238251e-05, -5.3073279559612274e-05, -5.076080560684204e-05, -4.844833165407181e-05, -4.6135857701301575e-05, -4.382338374853134e-05, -4.151090979576111e-05, -3.9198435842990875e-05, -3.688596189022064e-05, -3.457348793745041e-05, -3.2261013984680176e-05, -2.9948540031909943e-05, -2.763606607913971e-05, -2.5323592126369476e-05, -2.3011118173599243e-05, -2.069864422082901e-05, -1.8386170268058777e-05, -1.6073696315288544e-05, -1.376122236251831e-05, -1.1448748409748077e-05, -9.136274456977844e-06, -6.823800504207611e-06, -4.511326551437378e-06, -2.1988525986671448e-06, 1.1362135410308838e-07, 2.4260953068733215e-06, 4.738569259643555e-06, 7.051043212413788e-06, 9.363517165184021e-06, 1.1675991117954254e-05, 1.3988465070724487e-05, 1.630093902349472e-05, 1.8613412976264954e-05, 2.0925886929035187e-05, 2.323836088180542e-05, 2.5550834834575653e-05, 2.7863308787345886e-05, 3.017578274011612e-05, 3.248825669288635e-05, 3.4800730645656586e-05, 3.711320459842682e-05, 3.942567855119705e-05, 4.1738152503967285e-05, 4.405062645673752e-05, 4.636310040950775e-05, 4.8675574362277985e-05, 5.098804831504822e-05, 5.330052226781845e-05, 5.5612996220588684e-05, 5.792547017335892e-05, 6.023794412612915e-05, 6.255041807889938e-05, 6.486289203166962e-05, 6.717536598443985e-05, 6.948783993721008e-05, 7.180031388998032e-05, 7.411278784275055e-05, 7.642526179552078e-05, 7.873773574829102e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 1.0, 3.0, 7.0, 7.0, 15.0, 19.0, 27.0, 51.0, 86.0, 152.0, 249.0, 510.0, 1066.0, 2278.0, 6084.0, 19368.0, 121710.0, 733356.0, 132208.0, 20294.0, 6281.0, 2490.0, 1145.0, 519.0, 260.0, 135.0, 77.0, 44.0, 42.0, 19.0, 17.0, 9.0, 5.0, 5.0, 7.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006824493408203125, -0.006614625453948975, -0.006404757499694824, -0.006194889545440674, -0.0059850215911865234, -0.005775153636932373, -0.005565285682678223, -0.005355417728424072, -0.005145549774169922, -0.0049356818199157715, -0.004725813865661621, -0.004515945911407471, -0.00430607795715332, -0.00409621000289917, -0.0038863420486450195, -0.003676474094390869, -0.0034666061401367188, -0.0032567381858825684, -0.003046870231628418, -0.0028370022773742676, -0.002627134323120117, -0.002417266368865967, -0.0022073984146118164, -0.001997530460357666, -0.0017876625061035156, -0.0015777945518493652, -0.0013679265975952148, -0.0011580586433410645, -0.0009481906890869141, -0.0007383227348327637, -0.0005284547805786133, -0.0003185868263244629, -0.0001087188720703125, 0.00010114908218383789, 0.0003110170364379883, 0.0005208849906921387, 0.0007307529449462891, 0.0009406208992004395, 0.0011504888534545898, 0.0013603568077087402, 0.0015702247619628906, 0.001780092716217041, 0.0019899606704711914, 0.002199828624725342, 0.002409696578979492, 0.0026195645332336426, 0.002829432487487793, 0.0030393004417419434, 0.0032491683959960938, 0.003459036350250244, 0.0036689043045043945, 0.003878772258758545, 0.004088640213012695, 0.004298508167266846, 0.004508376121520996, 0.0047182440757751465, 0.004928112030029297, 0.005137979984283447, 0.005347847938537598, 0.005557715892791748, 0.0057675838470458984, 0.005977451801300049, 0.006187319755554199, 0.00639718770980835, 0.0066070556640625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 2.0, 7.0, 7.0, 8.0, 15.0, 33.0, 24.0, 41.0, 51.0, 68.0, 92.0, 106.0, 129.0, 95.0, 87.0, 55.0, 45.0, 34.0, 20.0, 17.0, 12.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0032749176025390625, -0.0031593739986419678, -0.003043830394744873, -0.0029282867908477783, -0.0028127431869506836, -0.002697199583053589, -0.002581655979156494, -0.0024661123752593994, -0.0023505687713623047, -0.00223502516746521, -0.0021194815635681152, -0.0020039379596710205, -0.0018883943557739258, -0.001772850751876831, -0.0016573071479797363, -0.0015417635440826416, -0.0014262199401855469, -0.0013106763362884521, -0.0011951327323913574, -0.0010795891284942627, -0.000964045524597168, -0.0008485019207000732, -0.0007329583168029785, -0.0006174147129058838, -0.0005018711090087891, -0.00038632750511169434, -0.0002707839012145996, -0.00015524029731750488, -3.9696693420410156e-05, 7.584691047668457e-05, 0.0001913905143737793, 0.000306934118270874, 0.00042247772216796875, 0.0005380213260650635, 0.0006535649299621582, 0.0007691085338592529, 0.0008846521377563477, 0.0010001957416534424, 0.0011157393455505371, 0.0012312829494476318, 0.0013468265533447266, 0.0014623701572418213, 0.001577913761138916, 0.0016934573650360107, 0.0018090009689331055, 0.0019245445728302002, 0.002040088176727295, 0.0021556317806243896, 0.0022711753845214844, 0.002386718988418579, 0.002502262592315674, 0.0026178061962127686, 0.0027333498001098633, 0.002848893404006958, 0.0029644370079040527, 0.0030799806118011475, 0.003195524215698242, 0.003311067819595337, 0.0034266114234924316, 0.0035421550273895264, 0.003657698631286621, 0.003773242235183716, 0.0038887858390808105, 0.004004329442977905, 0.004119873046875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 13.0, 15.0, 31.0, 71.0, 119.0, 187.0, 210.0, 156.0, 99.0, 54.0, 20.0, 12.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035235561430454254, -0.03350656479597092, -0.03177756816148758, -0.030048569664359093, -0.028319573029875755, -0.026590576395392418, -0.02486157789826393, -0.023132581263780594, -0.021403584629297256, -0.01967458799481392, -0.01794559136033058, -0.016216592863202095, -0.014487596228718758, -0.01275859959423542, -0.011029602028429508, -0.009300604462623596, -0.007571607828140259, -0.005842610727995634, -0.004113613627851009, -0.0023846165277063847, -0.00065561942756176, 0.0010733772069215775, 0.0028023747727274895, 0.0045313723385334015, 0.006260368973016739, 0.007989365607500076, 0.009718363173305988, 0.0114473607391119, 0.013176357373595238, 0.014905354008078575, 0.016634352505207062, 0.0183633491396904, 0.020092345774173737, 0.021821342408657074, 0.02355033904314041, 0.025279337540268898, 0.027008334174752235, 0.028737330809235573, 0.03046632930636406, 0.0321953259408474, 0.033924322575330734, 0.03565331920981407, 0.03738231584429741, 0.039111312478780746, 0.04084031283855438, 0.04256930947303772, 0.04429830610752106, 0.046027302742004395, 0.04775629937648773, 0.04948529601097107, 0.05121429264545441, 0.052943289279937744, 0.05467228591442108, 0.05640128254890442, 0.058130282908678055, 0.05985927954316139, 0.06158827617764473, 0.06331727653741837, 0.0650462731719017, 0.06677526980638504, 0.06850426644086838, 0.07023326307535172, 0.07196225970983505, 0.07369125634431839, 0.07542025297880173]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 5.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 2.0, 7.0, 9.0, 10.0, 11.0, 21.0, 19.0, 19.0, 11.0, 17.0, 24.0, 34.0, 27.0, 25.0, 39.0, 33.0, 24.0, 36.0, 32.0, 34.0, 44.0, 39.0, 35.0, 32.0, 45.0, 22.0, 34.0, 37.0, 33.0, 26.0, 33.0, 24.0, 24.0, 14.0, 19.0, 21.0, 12.0, 17.0, 11.0, 4.0, 2.0, 4.0, 3.0, 7.0, 6.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.017282605171203613, -0.016727164387702942, -0.01617172546684742, -0.015616285614669323, -0.015060845762491226, -0.01450540591031313, -0.013949966058135033, -0.013394526205956936, -0.012839086353778839, -0.012283646501600742, -0.011728206649422646, -0.011172766797244549, -0.010617326945066452, -0.010061887092888355, -0.009506447240710258, -0.008951007388532162, -0.008395567536354065, -0.007840127684175968, -0.007284687831997871, -0.006729247979819775, -0.006173808127641678, -0.005618368275463581, -0.005062928423285484, -0.0045074885711073875, -0.003952048718929291, -0.003396608866751194, -0.0028411690145730972, -0.0022857291623950005, -0.0017302893102169037, -0.001174849458038807, -0.0006194096058607101, -6.396975368261337e-05, 0.0004914700984954834, 0.0010469099506735802, 0.001602349802851677, 0.0021577896550297737, 0.0027132295072078705, 0.0032686693593859673, 0.003824109211564064, 0.004379549063742161, 0.004934988915920258, 0.005490428768098354, 0.006045868620276451, 0.006601308472454548, 0.007156748324632645, 0.007712188176810741, 0.008267628028988838, 0.008823067881166935, 0.009378507733345032, 0.009933947585523129, 0.010489387437701225, 0.011044827289879322, 0.011600267142057419, 0.012155706994235516, 0.012711146846413612, 0.01326658669859171, 0.013822026550769806, 0.014377466402947903, 0.014932906255126, 0.015488346107304096, 0.016043785959482193, 0.016599226742982864, 0.017154665663838387, 0.01771010458469391, 0.01826554536819458]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 7.0, 4.0, 10.0, 28.0, 36.0, 74.0, 134.0, 260.0, 639.0, 5866.0, 2393636.0, 1786817.0, 4495.0, 1540.0, 520.0, 111.0, 50.0, 35.0, 14.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0269012451171875, -0.0259401798248291, -0.024979114532470703, -0.024018049240112305, -0.023056983947753906, -0.022095918655395508, -0.02113485336303711, -0.02017378807067871, -0.019212722778320312, -0.018251657485961914, -0.017290592193603516, -0.016329526901245117, -0.015368461608886719, -0.01440739631652832, -0.013446331024169922, -0.012485265731811523, -0.011524200439453125, -0.010563135147094727, -0.009602069854736328, -0.00864100456237793, -0.007679939270019531, -0.006718873977661133, -0.005757808685302734, -0.004796743392944336, -0.0038356781005859375, -0.002874612808227539, -0.0019135475158691406, -0.0009524822235107422, 8.58306884765625e-06, 0.0009696483612060547, 0.0019307136535644531, 0.0028917789459228516, 0.00385284423828125, 0.0048139095306396484, 0.005774974822998047, 0.006736040115356445, 0.007697105407714844, 0.008658170700073242, 0.00961923599243164, 0.010580301284790039, 0.011541366577148438, 0.012502431869506836, 0.013463497161865234, 0.014424562454223633, 0.015385627746582031, 0.01634669303894043, 0.017307758331298828, 0.018268823623657227, 0.019229888916015625, 0.020190954208374023, 0.021152019500732422, 0.02211308479309082, 0.02307415008544922, 0.024035215377807617, 0.024996280670166016, 0.025957345962524414, 0.026918411254882812, 0.02787947654724121, 0.02884054183959961, 0.029801607131958008, 0.030762672424316406, 0.031723737716674805, 0.0326848030090332, 0.0336458683013916, 0.03460693359375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 47.0, 198.0, 383.0, 277.0, 89.0, 11.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.02227783203125, -0.021743297576904297, -0.021208763122558594, -0.02067422866821289, -0.020139694213867188, -0.019605159759521484, -0.01907062530517578, -0.018536090850830078, -0.018001556396484375, -0.017467021942138672, -0.01693248748779297, -0.016397953033447266, -0.015863418579101562, -0.01532888412475586, -0.014794349670410156, -0.014259815216064453, -0.01372528076171875, -0.013190746307373047, -0.012656211853027344, -0.01212167739868164, -0.011587142944335938, -0.011052608489990234, -0.010518074035644531, -0.009983539581298828, -0.009449005126953125, -0.008914470672607422, -0.008379936218261719, -0.007845401763916016, -0.0073108673095703125, -0.006776332855224609, -0.006241798400878906, -0.005707263946533203, -0.0051727294921875, -0.004638195037841797, -0.004103660583496094, -0.0035691261291503906, -0.0030345916748046875, -0.0025000572204589844, -0.0019655227661132812, -0.0014309883117675781, -0.000896453857421875, -0.0003619194030761719, 0.00017261505126953125, 0.0007071495056152344, 0.0012416839599609375, 0.0017762184143066406, 0.0023107528686523438, 0.002845287322998047, 0.00337982177734375, 0.003914356231689453, 0.004448890686035156, 0.004983425140380859, 0.0055179595947265625, 0.006052494049072266, 0.006587028503417969, 0.007121562957763672, 0.007656097412109375, 0.008190631866455078, 0.008725166320800781, 0.009259700775146484, 0.009794235229492188, 0.01032876968383789, 0.010863304138183594, 0.011397838592529297, 0.011932373046875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 7.0, 15.0, 23.0, 41.0, 77.0, 139.0, 219.0, 476.0, 931.0, 2604.0, 9991.0, 64337.0, 2624998.0, 1425488.0, 52124.0, 8750.0, 2373.0, 842.0, 381.0, 204.0, 107.0, 55.0, 28.0, 25.0, 17.0, 11.0, 4.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0111083984375, -0.010823190212249756, -0.010537981986999512, -0.010252773761749268, -0.009967565536499023, -0.00968235731124878, -0.009397149085998535, -0.009111940860748291, -0.008826732635498047, -0.008541524410247803, -0.008256316184997559, -0.007971107959747314, -0.00768589973449707, -0.007400691509246826, -0.007115483283996582, -0.006830275058746338, -0.006545066833496094, -0.00625985860824585, -0.0059746503829956055, -0.005689442157745361, -0.005404233932495117, -0.005119025707244873, -0.004833817481994629, -0.004548609256744385, -0.004263401031494141, -0.0039781928062438965, -0.0036929845809936523, -0.003407776355743408, -0.003122568130493164, -0.00283735990524292, -0.0025521516799926758, -0.0022669434547424316, -0.0019817352294921875, -0.0016965270042419434, -0.0014113187789916992, -0.001126110553741455, -0.0008409023284912109, -0.0005556941032409668, -0.00027048587799072266, 1.4722347259521484e-05, 0.0002999305725097656, 0.0005851387977600098, 0.0008703470230102539, 0.001155555248260498, 0.0014407634735107422, 0.0017259716987609863, 0.0020111799240112305, 0.0022963881492614746, 0.0025815963745117188, 0.002866804599761963, 0.003152012825012207, 0.003437221050262451, 0.0037224292755126953, 0.0040076375007629395, 0.004292845726013184, 0.004578053951263428, 0.004863262176513672, 0.005148470401763916, 0.00543367862701416, 0.005718886852264404, 0.0060040950775146484, 0.006289303302764893, 0.006574511528015137, 0.006859719753265381, 0.007144927978515625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 7.0, 7.0, 5.0, 6.0, 21.0, 16.0, 54.0, 74.0, 133.0, 342.0, 1123.0, 1432.0, 444.0, 154.0, 93.0, 56.0, 34.0, 24.0, 16.0, 17.0, 6.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007572174072265625, -0.007312357425689697, -0.0070525407791137695, -0.006792724132537842, -0.006532907485961914, -0.006273090839385986, -0.006013274192810059, -0.005753457546234131, -0.005493640899658203, -0.005233824253082275, -0.004974007606506348, -0.00471419095993042, -0.004454374313354492, -0.0041945576667785645, -0.003934741020202637, -0.003674924373626709, -0.0034151077270507812, -0.0031552910804748535, -0.0028954744338989258, -0.002635657787322998, -0.0023758411407470703, -0.0021160244941711426, -0.0018562078475952148, -0.0015963912010192871, -0.0013365745544433594, -0.0010767579078674316, -0.0008169412612915039, -0.0005571246147155762, -0.00029730796813964844, -3.74913215637207e-05, 0.00022232532501220703, 0.00048214197158813477, 0.0007419586181640625, 0.0010017752647399902, 0.001261591911315918, 0.0015214085578918457, 0.0017812252044677734, 0.002041041851043701, 0.002300858497619629, 0.0025606751441955566, 0.0028204917907714844, 0.003080308437347412, 0.00334012508392334, 0.0035999417304992676, 0.0038597583770751953, 0.004119575023651123, 0.004379391670227051, 0.0046392083168029785, 0.004899024963378906, 0.005158841609954834, 0.005418658256530762, 0.0056784749031066895, 0.005938291549682617, 0.006198108196258545, 0.006457924842834473, 0.0067177414894104, 0.006977558135986328, 0.007237374782562256, 0.007497191429138184, 0.007757008075714111, 0.008016824722290039, 0.008276641368865967, 0.008536458015441895, 0.008796274662017822, 0.00905609130859375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 13.0, 27.0, 40.0, 102.0, 184.0, 238.0, 214.0, 102.0, 45.0, 19.0, 11.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.031751930713653564, -0.030411282554268837, -0.02907063439488411, -0.027729984372854233, -0.026389336213469505, -0.025048688054084778, -0.0237080380320549, -0.022367389872670174, -0.021026741713285446, -0.01968609355390072, -0.01834544539451599, -0.017004795372486115, -0.015664147213101387, -0.01432349905371666, -0.012982849963009357, -0.011642200872302055, -0.010301552712917328, -0.0089609045535326, -0.007620255462825298, -0.0062796068377792835, -0.004938958212733269, -0.003598309587687254, -0.002257660962641239, -0.0009170118719339371, 0.0004236362874507904, 0.0017642849124968052, 0.00310493353754282, 0.004445582162588835, 0.0057862307876348495, 0.007126879412680864, 0.008467528037726879, 0.009808177128434181, 0.011148829013109207, 0.012489477172493935, 0.013830126263201237, 0.015170775353908539, 0.016511423513293266, 0.017852071672677994, 0.01919272169470787, 0.020533369854092598, 0.021874018013477325, 0.023214666172862053, 0.02455531433224678, 0.025895964354276657, 0.027236612513661385, 0.028577260673046112, 0.02991791069507599, 0.031258560717105865, 0.032599207013845444, 0.03393985703587532, 0.0352805033326149, 0.036621153354644775, 0.03796180337667465, 0.03930244967341423, 0.04064309969544411, 0.041983745992183685, 0.04332439601421356, 0.04466504603624344, 0.04600569233298302, 0.047346342355012894, 0.04868698865175247, 0.05002763867378235, 0.051368288695812225, 0.0527089387178421, 0.05404958501458168]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 5.0, 8.0, 13.0, 13.0, 14.0, 23.0, 28.0, 24.0, 32.0, 36.0, 49.0, 52.0, 48.0, 64.0, 59.0, 65.0, 61.0, 45.0, 59.0, 50.0, 41.0, 38.0, 41.0, 29.0, 21.0, 23.0, 15.0, 23.0, 7.0, 6.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0205267071723938, -0.01993541419506073, -0.01934412121772766, -0.018752828240394592, -0.018161535263061523, -0.017570242285728455, -0.016978949308395386, -0.016387656331062317, -0.015796363353729248, -0.01520507037639618, -0.01461377739906311, -0.014022484421730042, -0.013431191444396973, -0.012839898467063904, -0.012248605489730835, -0.011657312512397766, -0.011066019535064697, -0.010474726557731628, -0.00988343358039856, -0.00929214060306549, -0.008700847625732422, -0.008109554648399353, -0.007518261671066284, -0.006926968693733215, -0.0063356757164001465, -0.005744382739067078, -0.005153089761734009, -0.00456179678440094, -0.003970503807067871, -0.0033792108297348022, -0.0027879178524017334, -0.0021966248750686646, -0.0016053318977355957, -0.0010140389204025269, -0.000422745943069458, 0.00016854703426361084, 0.0007598400115966797, 0.0013511329889297485, 0.0019424259662628174, 0.0025337189435958862, 0.003125011920928955, 0.003716304898262024, 0.004307597875595093, 0.004898890852928162, 0.0054901838302612305, 0.006081476807594299, 0.006672769784927368, 0.007264062762260437, 0.007855355739593506, 0.008446648716926575, 0.009037941694259644, 0.009629234671592712, 0.010220527648925781, 0.01081182062625885, 0.011403113603591919, 0.011994406580924988, 0.012585699558258057, 0.013176992535591125, 0.013768285512924194, 0.014359578490257263, 0.014950871467590332, 0.015542164444923401, 0.01613345742225647, 0.01672475039958954, 0.017316043376922607]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 6.0, 7.0, 6.0, 22.0, 23.0, 21.0, 31.0, 39.0, 46.0, 63.0, 82.0, 120.0, 160.0, 238.0, 356.0, 532.0, 835.0, 1888.0, 6653.0, 56208.0, 762679.0, 198345.0, 14119.0, 2928.0, 1114.0, 621.0, 383.0, 271.0, 203.0, 144.0, 115.0, 70.0, 47.0, 43.0, 32.0, 19.0, 23.0, 10.0, 14.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.01885986328125, -0.018245697021484375, -0.01763153076171875, -0.017017364501953125, -0.0164031982421875, -0.015789031982421875, -0.01517486572265625, -0.014560699462890625, -0.013946533203125, -0.013332366943359375, -0.01271820068359375, -0.012104034423828125, -0.0114898681640625, -0.010875701904296875, -0.01026153564453125, -0.009647369384765625, -0.009033203125, -0.008419036865234375, -0.00780487060546875, -0.007190704345703125, -0.0065765380859375, -0.005962371826171875, -0.00534820556640625, -0.004734039306640625, -0.004119873046875, -0.003505706787109375, -0.00289154052734375, -0.002277374267578125, -0.0016632080078125, -0.001049041748046875, -0.00043487548828125, 0.000179290771484375, 0.00079345703125, 0.001407623291015625, 0.00202178955078125, 0.002635955810546875, 0.0032501220703125, 0.003864288330078125, 0.00447845458984375, 0.005092620849609375, 0.005706787109375, 0.006320953369140625, 0.00693511962890625, 0.007549285888671875, 0.0081634521484375, 0.008777618408203125, 0.00939178466796875, 0.010005950927734375, 0.0106201171875, 0.011234283447265625, 0.01184844970703125, 0.012462615966796875, 0.0130767822265625, 0.013690948486328125, 0.01430511474609375, 0.014919281005859375, 0.015533447265625, 0.016147613525390625, 0.01676177978515625, 0.017375946044921875, 0.0179901123046875, 0.018604278564453125, 0.01921844482421875, 0.019832611083984375, 0.02044677734375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 6.0, 23.0, 126.0, 350.0, 322.0, 151.0, 26.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0219879150390625, -0.02146470546722412, -0.020941495895385742, -0.020418286323547363, -0.019895076751708984, -0.019371867179870605, -0.018848657608032227, -0.018325448036193848, -0.01780223846435547, -0.01727902889251709, -0.01675581932067871, -0.016232609748840332, -0.015709400177001953, -0.015186190605163574, -0.014662981033325195, -0.014139771461486816, -0.013616561889648438, -0.013093352317810059, -0.01257014274597168, -0.0120469331741333, -0.011523723602294922, -0.011000514030456543, -0.010477304458618164, -0.009954094886779785, -0.009430885314941406, -0.008907675743103027, -0.008384466171264648, -0.00786125659942627, -0.007338047027587891, -0.006814837455749512, -0.006291627883911133, -0.005768418312072754, -0.005245208740234375, -0.004721999168395996, -0.004198789596557617, -0.0036755800247192383, -0.0031523704528808594, -0.0026291608810424805, -0.0021059513092041016, -0.0015827417373657227, -0.0010595321655273438, -0.0005363225936889648, -1.3113021850585938e-05, 0.000510096549987793, 0.0010333061218261719, 0.0015565156936645508, 0.0020797252655029297, 0.0026029348373413086, 0.0031261444091796875, 0.0036493539810180664, 0.004172563552856445, 0.004695773124694824, 0.005218982696533203, 0.005742192268371582, 0.006265401840209961, 0.00678861141204834, 0.007311820983886719, 0.007835030555725098, 0.008358240127563477, 0.008881449699401855, 0.009404659271240234, 0.009927868843078613, 0.010451078414916992, 0.010974287986755371, 0.01149749755859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 7.0, 3.0, 15.0, 10.0, 22.0, 28.0, 45.0, 52.0, 81.0, 114.0, 204.0, 308.0, 538.0, 1027.0, 2101.0, 4733.0, 11160.0, 31424.0, 111130.0, 426246.0, 337769.0, 80303.0, 23952.0, 9231.0, 3967.0, 1808.0, 941.0, 520.0, 273.0, 153.0, 118.0, 73.0, 43.0, 41.0, 33.0, 12.0, 17.0, 10.0, 15.0, 5.0, 8.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-0.01058197021484375, -0.010295093059539795, -0.01000821590423584, -0.009721338748931885, -0.00943446159362793, -0.009147584438323975, -0.00886070728302002, -0.008573830127716064, -0.00828695297241211, -0.008000075817108154, -0.007713198661804199, -0.007426321506500244, -0.007139444351196289, -0.006852567195892334, -0.006565690040588379, -0.006278812885284424, -0.005991935729980469, -0.005705058574676514, -0.005418181419372559, -0.0051313042640686035, -0.0048444271087646484, -0.004557549953460693, -0.004270672798156738, -0.003983795642852783, -0.003696918487548828, -0.003410041332244873, -0.003123164176940918, -0.002836287021636963, -0.002549409866333008, -0.0022625327110290527, -0.0019756555557250977, -0.0016887784004211426, -0.0014019012451171875, -0.0011150240898132324, -0.0008281469345092773, -0.0005412697792053223, -0.0002543926239013672, 3.248453140258789e-05, 0.00031936168670654297, 0.000606238842010498, 0.0008931159973144531, 0.0011799931526184082, 0.0014668703079223633, 0.0017537474632263184, 0.0020406246185302734, 0.0023275017738342285, 0.0026143789291381836, 0.0029012560844421387, 0.0031881332397460938, 0.003475010395050049, 0.003761887550354004, 0.004048764705657959, 0.004335641860961914, 0.004622519016265869, 0.004909396171569824, 0.005196273326873779, 0.005483150482177734, 0.0057700276374816895, 0.0060569047927856445, 0.0063437819480896, 0.006630659103393555, 0.00691753625869751, 0.007204413414001465, 0.00749129056930542, 0.007778167724609375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 7.0, 4.0, 7.0, 5.0, 7.0, 14.0, 11.0, 21.0, 19.0, 29.0, 46.0, 57.0, 65.0, 75.0, 64.0, 63.0, 93.0, 72.0, 70.0, 47.0, 59.0, 35.0, 23.0, 24.0, 18.0, 19.0, 15.0, 6.0, 6.0, 6.0, 2.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.0143585205078125, -0.013967752456665039, -0.013576984405517578, -0.013186216354370117, -0.012795448303222656, -0.012404680252075195, -0.012013912200927734, -0.011623144149780273, -0.011232376098632812, -0.010841608047485352, -0.01045083999633789, -0.01006007194519043, -0.009669303894042969, -0.009278535842895508, -0.008887767791748047, -0.008496999740600586, -0.008106231689453125, -0.007715463638305664, -0.007324695587158203, -0.006933927536010742, -0.006543159484863281, -0.00615239143371582, -0.005761623382568359, -0.0053708553314208984, -0.0049800872802734375, -0.0045893192291259766, -0.004198551177978516, -0.0038077831268310547, -0.0034170150756835938, -0.003026247024536133, -0.002635478973388672, -0.002244710922241211, -0.00185394287109375, -0.001463174819946289, -0.0010724067687988281, -0.0006816387176513672, -0.00029087066650390625, 9.989738464355469e-05, 0.0004906654357910156, 0.0008814334869384766, 0.0012722015380859375, 0.0016629695892333984, 0.0020537376403808594, 0.0024445056915283203, 0.0028352737426757812, 0.003226041793823242, 0.003616809844970703, 0.004007577896118164, 0.004398345947265625, 0.004789113998413086, 0.005179882049560547, 0.005570650100708008, 0.005961418151855469, 0.00635218620300293, 0.006742954254150391, 0.0071337223052978516, 0.0075244903564453125, 0.007915258407592773, 0.008306026458740234, 0.008696794509887695, 0.009087562561035156, 0.009478330612182617, 0.009869098663330078, 0.010259866714477539, 0.010650634765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 8.0, 15.0, 25.0, 14.0, 41.0, 58.0, 75.0, 139.0, 287.0, 494.0, 962.0, 1844.0, 3863.0, 8441.0, 19449.0, 51530.0, 183814.0, 534865.0, 162383.0, 47031.0, 17898.0, 7861.0, 3740.0, 1754.0, 869.0, 455.0, 252.0, 144.0, 88.0, 47.0, 40.0, 21.0, 17.0, 10.0, 7.0, 7.0, 6.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036468505859375, -0.00351870059967041, -0.0033905506134033203, -0.0032624006271362305, -0.0031342506408691406, -0.0030061006546020508, -0.002877950668334961, -0.002749800682067871, -0.0026216506958007812, -0.0024935007095336914, -0.0023653507232666016, -0.0022372007369995117, -0.002109050750732422, -0.001980900764465332, -0.0018527507781982422, -0.0017246007919311523, -0.0015964508056640625, -0.0014683008193969727, -0.0013401508331298828, -0.001212000846862793, -0.0010838508605957031, -0.0009557008743286133, -0.0008275508880615234, -0.0006994009017944336, -0.0005712509155273438, -0.0004431009292602539, -0.00031495094299316406, -0.00018680095672607422, -5.8650970458984375e-05, 6.949901580810547e-05, 0.0001976490020751953, 0.00032579898834228516, 0.000453948974609375, 0.0005820989608764648, 0.0007102489471435547, 0.0008383989334106445, 0.0009665489196777344, 0.0010946989059448242, 0.001222848892211914, 0.001350998878479004, 0.0014791488647460938, 0.0016072988510131836, 0.0017354488372802734, 0.0018635988235473633, 0.001991748809814453, 0.002119898796081543, 0.002248048782348633, 0.0023761987686157227, 0.0025043487548828125, 0.0026324987411499023, 0.002760648727416992, 0.002888798713684082, 0.003016948699951172, 0.0031450986862182617, 0.0032732486724853516, 0.0034013986587524414, 0.0035295486450195312, 0.003657698631286621, 0.003785848617553711, 0.003913998603820801, 0.004042148590087891, 0.0041702985763549805, 0.00429844856262207, 0.00442659854888916, 0.00455474853515625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 6.0, 7.0, 14.0, 12.0, 26.0, 19.0, 30.0, 49.0, 69.0, 75.0, 124.0, 124.0, 115.0, 89.0, 64.0, 50.0, 38.0, 23.0, 23.0, 14.0, 6.0, 7.0, 7.0, 8.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00012862682342529297, -0.00012479349970817566, -0.00012096017599105835, -0.00011712685227394104, -0.00011329352855682373, -0.00010946020483970642, -0.00010562688112258911, -0.0001017935574054718, -9.796023368835449e-05, -9.412690997123718e-05, -9.029358625411987e-05, -8.646026253700256e-05, -8.262693881988525e-05, -7.879361510276794e-05, -7.496029138565063e-05, -7.112696766853333e-05, -6.729364395141602e-05, -6.34603202342987e-05, -5.9626996517181396e-05, -5.579367280006409e-05, -5.196034908294678e-05, -4.812702536582947e-05, -4.429370164871216e-05, -4.046037793159485e-05, -3.662705421447754e-05, -3.279373049736023e-05, -2.896040678024292e-05, -2.512708306312561e-05, -2.12937593460083e-05, -1.746043562889099e-05, -1.3627111911773682e-05, -9.793788194656372e-06, -5.9604644775390625e-06, -2.127140760421753e-06, 1.7061829566955566e-06, 5.539506673812866e-06, 9.372830390930176e-06, 1.3206154108047485e-05, 1.7039477825164795e-05, 2.0872801542282104e-05, 2.4706125259399414e-05, 2.8539448976516724e-05, 3.237277269363403e-05, 3.620609641075134e-05, 4.003942012786865e-05, 4.387274384498596e-05, 4.770606756210327e-05, 5.153939127922058e-05, 5.537271499633789e-05, 5.92060387134552e-05, 6.303936243057251e-05, 6.687268614768982e-05, 7.070600986480713e-05, 7.453933358192444e-05, 7.837265729904175e-05, 8.220598101615906e-05, 8.603930473327637e-05, 8.987262845039368e-05, 9.370595216751099e-05, 9.75392758846283e-05, 0.0001013725996017456, 0.00010520592331886292, 0.00010903924703598022, 0.00011287257075309753, 0.00011670589447021484]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 9.0, 15.0, 16.0, 21.0, 36.0, 75.0, 107.0, 210.0, 362.0, 689.0, 1460.0, 3268.0, 7708.0, 20896.0, 70243.0, 443774.0, 400669.0, 65913.0, 19735.0, 7235.0, 3150.0, 1410.0, 709.0, 370.0, 161.0, 109.0, 73.0, 42.0, 30.0, 11.0, 16.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0], "bins": [-0.007129669189453125, -0.006946742534637451, -0.006763815879821777, -0.0065808892250061035, -0.00639796257019043, -0.006215035915374756, -0.006032109260559082, -0.005849182605743408, -0.005666255950927734, -0.0054833292961120605, -0.005300402641296387, -0.005117475986480713, -0.004934549331665039, -0.004751622676849365, -0.004568696022033691, -0.004385769367218018, -0.004202842712402344, -0.00401991605758667, -0.003836989402770996, -0.0036540627479553223, -0.0034711360931396484, -0.0032882094383239746, -0.0031052827835083008, -0.002922356128692627, -0.002739429473876953, -0.0025565028190612793, -0.0023735761642456055, -0.0021906495094299316, -0.002007722854614258, -0.001824796199798584, -0.0016418695449829102, -0.0014589428901672363, -0.0012760162353515625, -0.0010930895805358887, -0.0009101629257202148, -0.000727236270904541, -0.0005443096160888672, -0.00036138296127319336, -0.00017845630645751953, 4.470348358154297e-06, 0.00018739700317382812, 0.00037032365798950195, 0.0005532503128051758, 0.0007361769676208496, 0.0009191036224365234, 0.0011020302772521973, 0.001284956932067871, 0.001467883586883545, 0.0016508102416992188, 0.0018337368965148926, 0.0020166635513305664, 0.0021995902061462402, 0.002382516860961914, 0.002565443515777588, 0.0027483701705932617, 0.0029312968254089355, 0.0031142234802246094, 0.003297150135040283, 0.003480076789855957, 0.003663003444671631, 0.0038459300994873047, 0.0040288567543029785, 0.004211783409118652, 0.004394710063934326, 0.00457763671875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 0.0, 2.0, 3.0, 3.0, 13.0, 5.0, 8.0, 9.0, 21.0, 8.0, 19.0, 20.0, 29.0, 33.0, 47.0, 66.0, 83.0, 130.0, 132.0, 96.0, 62.0, 47.0, 24.0, 24.0, 18.0, 16.0, 15.0, 8.0, 11.0, 7.0, 10.0, 5.0, 4.0, 5.0, 9.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0034332275390625, -0.0033152103424072266, -0.003197193145751953, -0.0030791759490966797, -0.0029611587524414062, -0.002843141555786133, -0.0027251243591308594, -0.002607107162475586, -0.0024890899658203125, -0.002371072769165039, -0.0022530555725097656, -0.002135038375854492, -0.0020170211791992188, -0.0018990039825439453, -0.0017809867858886719, -0.0016629695892333984, -0.001544952392578125, -0.0014269351959228516, -0.0013089179992675781, -0.0011909008026123047, -0.0010728836059570312, -0.0009548664093017578, -0.0008368492126464844, -0.0007188320159912109, -0.0006008148193359375, -0.00048279762268066406, -0.0003647804260253906, -0.0002467632293701172, -0.00012874603271484375, -1.0728836059570312e-05, 0.00010728836059570312, 0.00022530555725097656, 0.00034332275390625, 0.00046133995056152344, 0.0005793571472167969, 0.0006973743438720703, 0.0008153915405273438, 0.0009334087371826172, 0.0010514259338378906, 0.001169443130493164, 0.0012874603271484375, 0.001405477523803711, 0.0015234947204589844, 0.0016415119171142578, 0.0017595291137695312, 0.0018775463104248047, 0.001995563507080078, 0.0021135807037353516, 0.002231597900390625, 0.0023496150970458984, 0.002467632293701172, 0.0025856494903564453, 0.0027036666870117188, 0.002821683883666992, 0.0029397010803222656, 0.003057718276977539, 0.0031757354736328125, 0.003293752670288086, 0.0034117698669433594, 0.003529787063598633, 0.0036478042602539062, 0.0037658214569091797, 0.003883838653564453, 0.0040018558502197266, 0.004119873046875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 20.0, 63.0, 306.0, 402.0, 162.0, 35.0, 12.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0706605464220047, -0.06601019203662872, -0.061359845101833344, -0.05670949071645737, -0.05205914378166199, -0.04740878939628601, -0.04275843873620033, -0.038108088076114655, -0.033457737416028976, -0.0288073867559433, -0.02415703609585762, -0.019506683573126793, -0.014856332913041115, -0.010205982252955437, -0.005555629730224609, -0.0009052790701389313, 0.003745071589946747, 0.008395422250032425, 0.013045773841440678, 0.01769612543284893, 0.02234647609293461, 0.026996826753020287, 0.031647179275751114, 0.03629752993583679, 0.04094788059592247, 0.04559823125600815, 0.050248581916093826, 0.054898932576179504, 0.05954928696155548, 0.06419963389635086, 0.06884998828172684, 0.07350033521652222, 0.0781506896018982, 0.08280104398727417, 0.08745139092206955, 0.09210174530744553, 0.0967520922422409, 0.10140244662761688, 0.10605280101299286, 0.11070314794778824, 0.11535349488258362, 0.1200038492679596, 0.12465419620275497, 0.12930454313755035, 0.13395489752292633, 0.1386052519083023, 0.14325560629367828, 0.14790594577789307, 0.15255630016326904, 0.15720665454864502, 0.161857008934021, 0.16650734841823578, 0.17115770280361176, 0.17580805718898773, 0.1804584115743637, 0.1851087510585785, 0.18975912034511566, 0.19440947473049164, 0.19905982911586761, 0.2037101686000824, 0.20836052298545837, 0.21301087737083435, 0.21766123175621033, 0.2223115861415863, 0.2269619256258011]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 5.0, 3.0, 3.0, 5.0, 6.0, 7.0, 2.0, 12.0, 16.0, 13.0, 11.0, 19.0, 26.0, 25.0, 32.0, 30.0, 28.0, 47.0, 27.0, 29.0, 42.0, 42.0, 49.0, 42.0, 48.0, 39.0, 32.0, 45.0, 36.0, 31.0, 28.0, 32.0, 26.0, 25.0, 24.0, 22.0, 16.0, 11.0, 16.0, 10.0, 8.0, 6.0, 10.0, 5.0, 4.0, 4.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.023510754108428955, -0.02280523255467415, -0.022099711000919342, -0.021394189447164536, -0.02068866789340973, -0.019983146339654922, -0.019277624785900116, -0.01857210323214531, -0.017866581678390503, -0.017161060124635696, -0.01645553857088089, -0.015750017017126083, -0.015044495463371277, -0.01433897390961647, -0.013633452355861664, -0.012927930802106857, -0.01222240924835205, -0.011516887694597244, -0.010811366140842438, -0.010105844587087631, -0.009400323033332825, -0.008694801479578018, -0.007989279925823212, -0.007283758372068405, -0.006578236818313599, -0.005872715264558792, -0.005167193710803986, -0.004461672157049179, -0.0037561506032943726, -0.003050629049539566, -0.0023451074957847595, -0.001639585942029953, -0.0009340643882751465, -0.00022854283452033997, 0.00047697871923446655, 0.001182500272989273, 0.0018880218267440796, 0.002593543380498886, 0.0032990649342536926, 0.004004586488008499, 0.004710108041763306, 0.005415629595518112, 0.006121151149272919, 0.006826672703027725, 0.007532194256782532, 0.008237715810537338, 0.008943237364292145, 0.009648758918046951, 0.010354280471801758, 0.011059802025556564, 0.01176532357931137, 0.012470845133066177, 0.013176366686820984, 0.01388188824057579, 0.014587409794330597, 0.015292931348085403, 0.01599845290184021, 0.016703974455595016, 0.017409496009349823, 0.01811501756310463, 0.018820539116859436, 0.019526060670614243, 0.02023158222436905, 0.020937103778123856, 0.021642625331878662]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 3.0, 7.0, 9.0, 10.0, 13.0, 13.0, 18.0, 25.0, 24.0, 34.0, 33.0, 52.0, 43.0, 80.0, 111.0, 144.0, 315.0, 848.0, 3082.0, 10122.0, 90748.0, 3897975.0, 172010.0, 12370.0, 2963.0, 1227.0, 785.0, 513.0, 347.0, 147.0, 70.0, 44.0, 21.0, 21.0, 9.0, 14.0, 7.0, 5.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.016632080078125, -0.0161895751953125, -0.0157470703125, -0.0153045654296875, -0.014862060546875, -0.0144195556640625, -0.01397705078125, -0.0135345458984375, -0.013092041015625, -0.0126495361328125, -0.01220703125, -0.0117645263671875, -0.011322021484375, -0.0108795166015625, -0.01043701171875, -0.0099945068359375, -0.009552001953125, -0.0091094970703125, -0.0086669921875, -0.0082244873046875, -0.007781982421875, -0.0073394775390625, -0.00689697265625, -0.0064544677734375, -0.006011962890625, -0.0055694580078125, -0.005126953125, -0.0046844482421875, -0.004241943359375, -0.0037994384765625, -0.00335693359375, -0.0029144287109375, -0.002471923828125, -0.0020294189453125, -0.0015869140625, -0.0011444091796875, -0.000701904296875, -0.0002593994140625, 0.00018310546875, 0.0006256103515625, 0.001068115234375, 0.0015106201171875, 0.001953125, 0.0023956298828125, 0.002838134765625, 0.0032806396484375, 0.00372314453125, 0.0041656494140625, 0.004608154296875, 0.0050506591796875, 0.0054931640625, 0.0059356689453125, 0.006378173828125, 0.0068206787109375, 0.00726318359375, 0.0077056884765625, 0.008148193359375, 0.0085906982421875, 0.009033203125, 0.0094757080078125, 0.009918212890625, 0.0103607177734375, 0.01080322265625, 0.0112457275390625, 0.011688232421875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 10.0, 52.0, 207.0, 400.0, 240.0, 84.0, 14.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0222015380859375, -0.021667838096618652, -0.021134138107299805, -0.020600438117980957, -0.02006673812866211, -0.01953303813934326, -0.018999338150024414, -0.018465638160705566, -0.01793193817138672, -0.01739823818206787, -0.016864538192749023, -0.016330838203430176, -0.015797138214111328, -0.01526343822479248, -0.014729738235473633, -0.014196038246154785, -0.013662338256835938, -0.01312863826751709, -0.012594938278198242, -0.012061238288879395, -0.011527538299560547, -0.0109938383102417, -0.010460138320922852, -0.009926438331604004, -0.009392738342285156, -0.008859038352966309, -0.008325338363647461, -0.007791638374328613, -0.007257938385009766, -0.006724238395690918, -0.00619053840637207, -0.005656838417053223, -0.005123138427734375, -0.004589438438415527, -0.00405573844909668, -0.003522038459777832, -0.0029883384704589844, -0.0024546384811401367, -0.001920938491821289, -0.0013872385025024414, -0.0008535385131835938, -0.0003198385238647461, 0.00021386146545410156, 0.0007475614547729492, 0.0012812614440917969, 0.0018149614334106445, 0.002348661422729492, 0.00288236141204834, 0.0034160614013671875, 0.003949761390686035, 0.004483461380004883, 0.0050171613693237305, 0.005550861358642578, 0.006084561347961426, 0.0066182613372802734, 0.007151961326599121, 0.007685661315917969, 0.008219361305236816, 0.008753061294555664, 0.009286761283874512, 0.00982046127319336, 0.010354161262512207, 0.010887861251831055, 0.011421561241149902, 0.01195526123046875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 5.0, 6.0, 18.0, 23.0, 42.0, 54.0, 71.0, 154.0, 215.0, 530.0, 1247.0, 4382.0, 27122.0, 790794.0, 3306956.0, 52683.0, 6785.0, 1818.0, 681.0, 316.0, 159.0, 76.0, 45.0, 33.0, 15.0, 16.0, 8.0, 5.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01256561279296875, -0.012118935585021973, -0.011672258377075195, -0.011225581169128418, -0.01077890396118164, -0.010332226753234863, -0.009885549545288086, -0.009438872337341309, -0.008992195129394531, -0.008545517921447754, -0.008098840713500977, -0.007652163505554199, -0.007205486297607422, -0.0067588090896606445, -0.006312131881713867, -0.00586545467376709, -0.0054187774658203125, -0.004972100257873535, -0.004525423049926758, -0.0040787458419799805, -0.003632068634033203, -0.0031853914260864258, -0.0027387142181396484, -0.002292037010192871, -0.0018453598022460938, -0.0013986825942993164, -0.0009520053863525391, -0.0005053281784057617, -5.8650970458984375e-05, 0.00038802623748779297, 0.0008347034454345703, 0.0012813806533813477, 0.001728057861328125, 0.0021747350692749023, 0.0026214122772216797, 0.003068089485168457, 0.0035147666931152344, 0.003961443901062012, 0.004408121109008789, 0.004854798316955566, 0.005301475524902344, 0.005748152732849121, 0.0061948299407958984, 0.006641507148742676, 0.007088184356689453, 0.0075348615646362305, 0.007981538772583008, 0.008428215980529785, 0.008874893188476562, 0.00932157039642334, 0.009768247604370117, 0.010214924812316895, 0.010661602020263672, 0.01110827922821045, 0.011554956436157227, 0.012001633644104004, 0.012448310852050781, 0.012894988059997559, 0.013341665267944336, 0.013788342475891113, 0.01423501968383789, 0.014681696891784668, 0.015128374099731445, 0.015575051307678223, 0.016021728515625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 3.0, 7.0, 22.0, 41.0, 61.0, 104.0, 241.0, 629.0, 1616.0, 758.0, 245.0, 133.0, 75.0, 51.0, 26.0, 17.0, 11.0, 10.0, 9.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.013336181640625, -0.012989997863769531, -0.012643814086914062, -0.012297630310058594, -0.011951446533203125, -0.011605262756347656, -0.011259078979492188, -0.010912895202636719, -0.01056671142578125, -0.010220527648925781, -0.009874343872070312, -0.009528160095214844, -0.009181976318359375, -0.008835792541503906, -0.008489608764648438, -0.008143424987792969, -0.0077972412109375, -0.007451057434082031, -0.0071048736572265625, -0.006758689880371094, -0.006412506103515625, -0.006066322326660156, -0.0057201385498046875, -0.005373954772949219, -0.00502777099609375, -0.004681587219238281, -0.0043354034423828125, -0.003989219665527344, -0.003643035888671875, -0.0032968521118164062, -0.0029506683349609375, -0.0026044845581054688, -0.00225830078125, -0.0019121170043945312, -0.0015659332275390625, -0.0012197494506835938, -0.000873565673828125, -0.0005273818969726562, -0.0001811981201171875, 0.00016498565673828125, 0.00051116943359375, 0.0008573532104492188, 0.0012035369873046875, 0.0015497207641601562, 0.001895904541015625, 0.0022420883178710938, 0.0025882720947265625, 0.0029344558715820312, 0.0032806396484375, 0.0036268234252929688, 0.0039730072021484375, 0.004319190979003906, 0.004665374755859375, 0.005011558532714844, 0.0053577423095703125, 0.005703926086425781, 0.00605010986328125, 0.006396293640136719, 0.0067424774169921875, 0.007088661193847656, 0.007434844970703125, 0.007781028747558594, 0.008127212524414062, 0.008473396301269531, 0.008819580078125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 12.0, 41.0, 101.0, 231.0, 297.0, 224.0, 58.0, 17.0, 8.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053975556045770645, -0.05155741423368454, -0.04913927614688873, -0.04672113433480263, -0.04430299252271652, -0.04188485071063042, -0.03946670889854431, -0.037048570811748505, -0.0346304289996624, -0.032212287187576294, -0.029794147238135338, -0.02737600728869438, -0.024957865476608276, -0.02253972366452217, -0.020121583715081215, -0.01770344376564026, -0.015285301953554153, -0.012867161072790623, -0.010449020192027092, -0.008030879311263561, -0.0056127384305000305, -0.0031945975497365, -0.0007764566689729691, 0.001641683280467987, 0.004059825092554092, 0.006477965973317623, 0.008896106854081154, 0.011314247734844685, 0.013732388615608215, 0.01615053042769432, 0.018568670377135277, 0.020986810326576233, 0.023404955863952637, 0.025823097676038742, 0.028241237625479698, 0.030659377574920654, 0.03307751938700676, 0.035495661199092865, 0.03791379928588867, 0.04033194109797478, 0.04275008291006088, 0.04516822472214699, 0.04758636653423309, 0.0500045046210289, 0.052422646433115005, 0.05484078824520111, 0.05725892633199692, 0.05967706814408302, 0.06209520995616913, 0.06451334804296494, 0.06693149358034134, 0.06934963166713715, 0.07176777720451355, 0.07418591529130936, 0.07660405337810516, 0.07902219891548157, 0.08144033700227737, 0.08385847508907318, 0.08627662062644958, 0.08869475871324539, 0.0911128968000412, 0.0935310423374176, 0.09594918042421341, 0.09836731851100922, 0.10078546404838562]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 6.0, 7.0, 32.0, 13.0, 21.0, 26.0, 40.0, 37.0, 40.0, 58.0, 63.0, 51.0, 77.0, 77.0, 74.0, 62.0, 84.0, 44.0, 37.0, 34.0, 21.0, 23.0, 23.0, 11.0, 12.0, 7.0, 8.0, 4.0, 1.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.036922574043273926, -0.035993389785289764, -0.0350642092525959, -0.03413502871990204, -0.03320584446191788, -0.032276660203933716, -0.03134747967123985, -0.03041829727590084, -0.02948911488056183, -0.028559932485222816, -0.027630750089883804, -0.026701567694544792, -0.02577238529920578, -0.024843202903866768, -0.023914020508527756, -0.022984838113188744, -0.02205565571784973, -0.02112647332251072, -0.020197290927171707, -0.019268108531832695, -0.018338926136493683, -0.01740974374115467, -0.01648056134581566, -0.015551378950476646, -0.014622196555137634, -0.013693014159798622, -0.01276383176445961, -0.011834649369120598, -0.010905466973781586, -0.009976284578442574, -0.009047102183103561, -0.00811791978776455, -0.007188737392425537, -0.006259554997086525, -0.005330372601747513, -0.004401190206408501, -0.0034720078110694885, -0.0025428254157304764, -0.0016136430203914642, -0.0006844606250524521, 0.00024472177028656006, 0.0011739041656255722, 0.0021030865609645844, 0.0030322689563035965, 0.003961451351642609, 0.004890633746981621, 0.005819816142320633, 0.006748998537659645, 0.007678180932998657, 0.00860736332833767, 0.009536545723676682, 0.010465728119015694, 0.011394910514354706, 0.012324092909693718, 0.01325327530503273, 0.014182457700371742, 0.015111640095710754, 0.016040822491049767, 0.01697000488638878, 0.01789918728172779, 0.018828369677066803, 0.019757552072405815, 0.020686734467744827, 0.02161591686308384, 0.02254509925842285]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 7.0, 8.0, 5.0, 11.0, 12.0, 18.0, 14.0, 36.0, 42.0, 74.0, 67.0, 146.0, 192.0, 298.0, 504.0, 799.0, 2368.0, 14904.0, 452558.0, 554045.0, 17541.0, 2559.0, 963.0, 481.0, 296.0, 177.0, 108.0, 91.0, 72.0, 46.0, 30.0, 21.0, 12.0, 11.0, 15.0, 9.0, 8.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.032623291015625, -0.0316920280456543, -0.030760765075683594, -0.02982950210571289, -0.028898239135742188, -0.027966976165771484, -0.02703571319580078, -0.026104450225830078, -0.025173187255859375, -0.024241924285888672, -0.02331066131591797, -0.022379398345947266, -0.021448135375976562, -0.02051687240600586, -0.019585609436035156, -0.018654346466064453, -0.01772308349609375, -0.016791820526123047, -0.015860557556152344, -0.01492929458618164, -0.013998031616210938, -0.013066768646240234, -0.012135505676269531, -0.011204242706298828, -0.010272979736328125, -0.009341716766357422, -0.008410453796386719, -0.007479190826416016, -0.0065479278564453125, -0.005616664886474609, -0.004685401916503906, -0.003754138946533203, -0.0028228759765625, -0.0018916130065917969, -0.0009603500366210938, -2.9087066650390625e-05, 0.0009021759033203125, 0.0018334388732910156, 0.0027647018432617188, 0.003695964813232422, 0.004627227783203125, 0.005558490753173828, 0.006489753723144531, 0.007421016693115234, 0.008352279663085938, 0.00928354263305664, 0.010214805603027344, 0.011146068572998047, 0.01207733154296875, 0.013008594512939453, 0.013939857482910156, 0.01487112045288086, 0.015802383422851562, 0.016733646392822266, 0.01766490936279297, 0.018596172332763672, 0.019527435302734375, 0.020458698272705078, 0.02138996124267578, 0.022321224212646484, 0.023252487182617188, 0.02418375015258789, 0.025115013122558594, 0.026046276092529297, 0.0269775390625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 61.0, 212.0, 365.0, 255.0, 88.0, 17.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02166748046875, -0.021133899688720703, -0.020600318908691406, -0.02006673812866211, -0.019533157348632812, -0.018999576568603516, -0.01846599578857422, -0.017932415008544922, -0.017398834228515625, -0.016865253448486328, -0.01633167266845703, -0.015798091888427734, -0.015264511108398438, -0.01473093032836914, -0.014197349548339844, -0.013663768768310547, -0.01313018798828125, -0.012596607208251953, -0.012063026428222656, -0.01152944564819336, -0.010995864868164062, -0.010462284088134766, -0.009928703308105469, -0.009395122528076172, -0.008861541748046875, -0.008327960968017578, -0.007794380187988281, -0.007260799407958984, -0.0067272186279296875, -0.006193637847900391, -0.005660057067871094, -0.005126476287841797, -0.0045928955078125, -0.004059314727783203, -0.0035257339477539062, -0.0029921531677246094, -0.0024585723876953125, -0.0019249916076660156, -0.0013914108276367188, -0.0008578300476074219, -0.000324249267578125, 0.00020933151245117188, 0.0007429122924804688, 0.0012764930725097656, 0.0018100738525390625, 0.0023436546325683594, 0.0028772354125976562, 0.003410816192626953, 0.00394439697265625, 0.004477977752685547, 0.005011558532714844, 0.005545139312744141, 0.0060787200927734375, 0.006612300872802734, 0.007145881652832031, 0.007679462432861328, 0.008213043212890625, 0.008746623992919922, 0.009280204772949219, 0.009813785552978516, 0.010347366333007812, 0.01088094711303711, 0.011414527893066406, 0.011948108673095703, 0.012481689453125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 10.0, 13.0, 15.0, 14.0, 24.0, 31.0, 50.0, 95.0, 138.0, 189.0, 311.0, 542.0, 972.0, 1748.0, 3747.0, 8314.0, 21200.0, 68701.0, 277518.0, 461586.0, 140464.0, 38337.0, 13235.0, 5442.0, 2665.0, 1330.0, 693.0, 424.0, 217.0, 182.0, 107.0, 64.0, 51.0, 32.0, 29.0, 16.0, 8.0, 14.0, 2.0, 3.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.01136016845703125, -0.011008024215698242, -0.010655879974365234, -0.010303735733032227, -0.009951591491699219, -0.009599447250366211, -0.009247303009033203, -0.008895158767700195, -0.008543014526367188, -0.00819087028503418, -0.007838726043701172, -0.007486581802368164, -0.007134437561035156, -0.0067822933197021484, -0.006430149078369141, -0.006078004837036133, -0.005725860595703125, -0.005373716354370117, -0.005021572113037109, -0.0046694278717041016, -0.004317283630371094, -0.003965139389038086, -0.003612995147705078, -0.0032608509063720703, -0.0029087066650390625, -0.0025565624237060547, -0.002204418182373047, -0.001852273941040039, -0.0015001296997070312, -0.0011479854583740234, -0.0007958412170410156, -0.0004436969757080078, -9.1552734375e-05, 0.0002605915069580078, 0.0006127357482910156, 0.0009648799896240234, 0.0013170242309570312, 0.001669168472290039, 0.002021312713623047, 0.0023734569549560547, 0.0027256011962890625, 0.0030777454376220703, 0.003429889678955078, 0.003782033920288086, 0.004134178161621094, 0.0044863224029541016, 0.004838466644287109, 0.005190610885620117, 0.005542755126953125, 0.005894899368286133, 0.006247043609619141, 0.0065991878509521484, 0.006951332092285156, 0.007303476333618164, 0.007655620574951172, 0.00800776481628418, 0.008359909057617188, 0.008712053298950195, 0.009064197540283203, 0.009416341781616211, 0.009768486022949219, 0.010120630264282227, 0.010472774505615234, 0.010824918746948242, 0.01117706298828125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 4.0, 6.0, 4.0, 15.0, 17.0, 9.0, 27.0, 25.0, 37.0, 47.0, 54.0, 63.0, 62.0, 72.0, 78.0, 74.0, 71.0, 67.0, 65.0, 54.0, 32.0, 26.0, 24.0, 11.0, 5.0, 10.0, 7.0, 8.0, 7.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016632080078125, -0.016149520874023438, -0.015666961669921875, -0.015184402465820312, -0.01470184326171875, -0.014219284057617188, -0.013736724853515625, -0.013254165649414062, -0.0127716064453125, -0.012289047241210938, -0.011806488037109375, -0.011323928833007812, -0.01084136962890625, -0.010358810424804688, -0.009876251220703125, -0.009393692016601562, -0.0089111328125, -0.008428573608398438, -0.007946014404296875, -0.0074634552001953125, -0.00698089599609375, -0.0064983367919921875, -0.006015777587890625, -0.0055332183837890625, -0.0050506591796875, -0.0045680999755859375, -0.004085540771484375, -0.0036029815673828125, -0.00312042236328125, -0.0026378631591796875, -0.002155303955078125, -0.0016727447509765625, -0.001190185546875, -0.0007076263427734375, -0.000225067138671875, 0.0002574920654296875, 0.00074005126953125, 0.0012226104736328125, 0.001705169677734375, 0.0021877288818359375, 0.0026702880859375, 0.0031528472900390625, 0.003635406494140625, 0.0041179656982421875, 0.00460052490234375, 0.0050830841064453125, 0.005565643310546875, 0.0060482025146484375, 0.00653076171875, 0.0070133209228515625, 0.007495880126953125, 0.007978439331054688, 0.00846099853515625, 0.008943557739257812, 0.009426116943359375, 0.009908676147460938, 0.0103912353515625, 0.010873794555664062, 0.011356353759765625, 0.011838912963867188, 0.01232147216796875, 0.012804031372070312, 0.013286590576171875, 0.013769149780273438, 0.014251708984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 15.0, 9.0, 20.0, 24.0, 41.0, 62.0, 85.0, 144.0, 234.0, 321.0, 534.0, 887.0, 1506.0, 2475.0, 4296.0, 7873.0, 14942.0, 29755.0, 64495.0, 159312.0, 387276.0, 215127.0, 82049.0, 37061.0, 18071.0, 9420.0, 5237.0, 2857.0, 1746.0, 979.0, 617.0, 373.0, 276.0, 145.0, 95.0, 75.0, 34.0, 27.0, 24.0, 14.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00337982177734375, -0.00327301025390625, -0.00316619873046875, -0.00305938720703125, -0.00295257568359375, -0.00284576416015625, -0.00273895263671875, -0.00263214111328125, -0.00252532958984375, -0.00241851806640625, -0.00231170654296875, -0.00220489501953125, -0.00209808349609375, -0.00199127197265625, -0.00188446044921875, -0.00177764892578125, -0.00167083740234375, -0.00156402587890625, -0.00145721435546875, -0.00135040283203125, -0.00124359130859375, -0.00113677978515625, -0.00102996826171875, -0.00092315673828125, -0.00081634521484375, -0.00070953369140625, -0.00060272216796875, -0.00049591064453125, -0.00038909912109375, -0.00028228759765625, -0.00017547607421875, -6.866455078125e-05, 3.814697265625e-05, 0.00014495849609375, 0.00025177001953125, 0.00035858154296875, 0.00046539306640625, 0.00057220458984375, 0.00067901611328125, 0.00078582763671875, 0.00089263916015625, 0.00099945068359375, 0.00110626220703125, 0.00121307373046875, 0.00131988525390625, 0.00142669677734375, 0.00153350830078125, 0.00164031982421875, 0.00174713134765625, 0.00185394287109375, 0.00196075439453125, 0.00206756591796875, 0.00217437744140625, 0.00228118896484375, 0.00238800048828125, 0.00249481201171875, 0.00260162353515625, 0.00270843505859375, 0.00281524658203125, 0.00292205810546875, 0.00302886962890625, 0.00313568115234375, 0.00324249267578125, 0.00334930419921875, 0.00345611572265625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 7.0, 11.0, 6.0, 5.0, 11.0, 8.0, 18.0, 14.0, 33.0, 40.0, 48.0, 58.0, 83.0, 106.0, 91.0, 106.0, 77.0, 70.0, 49.0, 35.0, 32.0, 15.0, 23.0, 8.0, 10.0, 8.0, 5.0, 2.0, 3.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.524822235107422e-05, -9.22931358218193e-05, -8.933804929256439e-05, -8.638296276330948e-05, -8.342787623405457e-05, -8.047278970479965e-05, -7.751770317554474e-05, -7.456261664628983e-05, -7.160753011703491e-05, -6.865244358778e-05, -6.569735705852509e-05, -6.274227052927017e-05, -5.978718400001526e-05, -5.6832097470760345e-05, -5.387701094150543e-05, -5.092192441225052e-05, -4.7966837882995605e-05, -4.501175135374069e-05, -4.205666482448578e-05, -3.9101578295230865e-05, -3.614649176597595e-05, -3.319140523672104e-05, -3.0236318707466125e-05, -2.7281232178211212e-05, -2.43261456489563e-05, -2.1371059119701385e-05, -1.8415972590446472e-05, -1.546088606119156e-05, -1.2505799531936646e-05, -9.550713002681732e-06, -6.595626473426819e-06, -3.6405399441719055e-06, -6.854534149169922e-07, 2.269633114337921e-06, 5.2247196435928345e-06, 8.179806172847748e-06, 1.1134892702102661e-05, 1.4089979231357574e-05, 1.7045065760612488e-05, 2.00001522898674e-05, 2.2955238819122314e-05, 2.5910325348377228e-05, 2.886541187763214e-05, 3.1820498406887054e-05, 3.477558493614197e-05, 3.773067146539688e-05, 4.0685757994651794e-05, 4.364084452390671e-05, 4.659593105316162e-05, 4.9551017582416534e-05, 5.250610411167145e-05, 5.546119064092636e-05, 5.8416277170181274e-05, 6.137136369943619e-05, 6.43264502286911e-05, 6.728153675794601e-05, 7.023662328720093e-05, 7.319170981645584e-05, 7.614679634571075e-05, 7.910188287496567e-05, 8.205696940422058e-05, 8.50120559334755e-05, 8.796714246273041e-05, 9.092222899198532e-05, 9.387731552124023e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 10.0, 7.0, 3.0, 12.0, 17.0, 27.0, 29.0, 52.0, 75.0, 135.0, 228.0, 439.0, 723.0, 1340.0, 2811.0, 5913.0, 13200.0, 33579.0, 96547.0, 412149.0, 344445.0, 84174.0, 29790.0, 12007.0, 5224.0, 2594.0, 1357.0, 724.0, 392.0, 227.0, 109.0, 76.0, 51.0, 30.0, 24.0, 14.0, 8.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.006053924560546875, -0.005885481834411621, -0.005717039108276367, -0.005548596382141113, -0.005380153656005859, -0.0052117109298706055, -0.0050432682037353516, -0.004874825477600098, -0.004706382751464844, -0.00453794002532959, -0.004369497299194336, -0.004201054573059082, -0.004032611846923828, -0.0038641691207885742, -0.0036957263946533203, -0.0035272836685180664, -0.0033588409423828125, -0.0031903982162475586, -0.0030219554901123047, -0.0028535127639770508, -0.002685070037841797, -0.002516627311706543, -0.002348184585571289, -0.002179741859436035, -0.0020112991333007812, -0.0018428564071655273, -0.0016744136810302734, -0.0015059709548950195, -0.0013375282287597656, -0.0011690855026245117, -0.0010006427764892578, -0.0008322000503540039, -0.00066375732421875, -0.0004953145980834961, -0.0003268718719482422, -0.00015842914581298828, 1.0013580322265625e-05, 0.00017845630645751953, 0.00034689903259277344, 0.0005153417587280273, 0.0006837844848632812, 0.0008522272109985352, 0.001020669937133789, 0.001189112663269043, 0.0013575553894042969, 0.0015259981155395508, 0.0016944408416748047, 0.0018628835678100586, 0.0020313262939453125, 0.0021997690200805664, 0.0023682117462158203, 0.0025366544723510742, 0.002705097198486328, 0.002873539924621582, 0.003041982650756836, 0.00321042537689209, 0.0033788681030273438, 0.0035473108291625977, 0.0037157535552978516, 0.0038841962814331055, 0.004052639007568359, 0.004221081733703613, 0.004389524459838867, 0.004557967185974121, 0.004726409912109375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 10.0, 13.0, 12.0, 15.0, 28.0, 25.0, 36.0, 50.0, 53.0, 85.0, 110.0, 137.0, 104.0, 73.0, 71.0, 33.0, 29.0, 31.0, 19.0, 9.0, 14.0, 8.0, 7.0, 5.0, 2.0, 3.0, 1.0, 4.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005950927734375, -0.0057675838470458984, -0.005584239959716797, -0.005400896072387695, -0.005217552185058594, -0.005034208297729492, -0.004850864410400391, -0.004667520523071289, -0.0044841766357421875, -0.004300832748413086, -0.004117488861083984, -0.003934144973754883, -0.0037508010864257812, -0.0035674571990966797, -0.003384113311767578, -0.0032007694244384766, -0.003017425537109375, -0.0028340816497802734, -0.002650737762451172, -0.0024673938751220703, -0.0022840499877929688, -0.002100706100463867, -0.0019173622131347656, -0.001734018325805664, -0.0015506744384765625, -0.001367330551147461, -0.0011839866638183594, -0.0010006427764892578, -0.0008172988891601562, -0.0006339550018310547, -0.0004506111145019531, -0.00026726722717285156, -8.392333984375e-05, 9.942054748535156e-05, 0.0002827644348144531, 0.0004661083221435547, 0.0006494522094726562, 0.0008327960968017578, 0.0010161399841308594, 0.001199483871459961, 0.0013828277587890625, 0.001566171646118164, 0.0017495155334472656, 0.0019328594207763672, 0.0021162033081054688, 0.0022995471954345703, 0.002482891082763672, 0.0026662349700927734, 0.002849578857421875, 0.0030329227447509766, 0.003216266632080078, 0.0033996105194091797, 0.0035829544067382812, 0.003766298294067383, 0.003949642181396484, 0.004132986068725586, 0.0043163299560546875, 0.004499673843383789, 0.004683017730712891, 0.004866361618041992, 0.005049705505371094, 0.005233049392700195, 0.005416393280029297, 0.0055997371673583984, 0.0057830810546875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 12.0, 21.0, 33.0, 87.0, 120.0, 157.0, 176.0, 142.0, 96.0, 59.0, 38.0, 18.0, 10.0, 5.0, 9.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08763383328914642, -0.08541546761989594, -0.08319710940122604, -0.08097874373197556, -0.07876038551330566, -0.07654201984405518, -0.07432366162538528, -0.0721052959561348, -0.0698869377374649, -0.06766857206821442, -0.06545021384954453, -0.06323184818029404, -0.061013489961624146, -0.05879512429237366, -0.05657676234841347, -0.05435840040445328, -0.05214003473520279, -0.0499216727912426, -0.04770331084728241, -0.04548494890332222, -0.04326658695936203, -0.04104822129011154, -0.03882985934615135, -0.03661149740219116, -0.03439313545823097, -0.03217477351427078, -0.029956411570310593, -0.027738047763705254, -0.025519685819745064, -0.023301323875784874, -0.021082960069179535, -0.018864598125219345, -0.016646236181259155, -0.014427874237298965, -0.012209511362016201, -0.009991148486733437, -0.007772786542773247, -0.005554424598813057, -0.0033360617235302925, -0.001117698848247528, 0.0011006630957126617, 0.003319025505334139, 0.005537387914955616, 0.007755750324577093, 0.00997411273419857, 0.01219247467815876, 0.014410837553441525, 0.01662920042872429, 0.01884756237268448, 0.02106592431664467, 0.02328428626060486, 0.025502650067210197, 0.027721012011170387, 0.029939373955130577, 0.032157737761735916, 0.034376099705696106, 0.036594461649656296, 0.038812823593616486, 0.041031185537576675, 0.043249547481536865, 0.045467913150787354, 0.047686271369457245, 0.04990463703870773, 0.05212299898266792, 0.05434136092662811]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 11.0, 2.0, 10.0, 13.0, 16.0, 12.0, 13.0, 7.0, 24.0, 25.0, 20.0, 25.0, 27.0, 41.0, 29.0, 40.0, 36.0, 38.0, 34.0, 36.0, 37.0, 37.0, 39.0, 28.0, 39.0, 38.0, 32.0, 41.0, 28.0, 36.0, 29.0, 21.0, 18.0, 17.0, 23.0, 12.0, 12.0, 12.0, 10.0, 7.0, 6.0, 6.0, 3.0, 3.0, 2.0, 0.0, 1.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025050997734069824, -0.024188131093978882, -0.02332526259124279, -0.0224623940885067, -0.021599527448415756, -0.020736660808324814, -0.019873792305588722, -0.01901092380285263, -0.018148057162761688, -0.017285190522670746, -0.016422322019934654, -0.015559454448521137, -0.01469658687710762, -0.013833719305694103, -0.012970851734280586, -0.01210798416286707, -0.011245116591453552, -0.010382249020040035, -0.009519381448626518, -0.008656513877213001, -0.007793646305799484, -0.006930778734385967, -0.00606791116297245, -0.005205043591558933, -0.004342176020145416, -0.0034793084487318993, -0.0026164408773183823, -0.0017535733059048653, -0.0008907057344913483, -2.783816307783127e-05, 0.0008350294083356857, 0.0016978969797492027, 0.0025607645511627197, 0.0034236321225762367, 0.004286499693989754, 0.005149367265403271, 0.006012234836816788, 0.006875102408230305, 0.007737969979643822, 0.008600837551057339, 0.009463705122470856, 0.010326572693884373, 0.01118944026529789, 0.012052307836711407, 0.012915175408124924, 0.01377804297953844, 0.014640910550951958, 0.015503778122365475, 0.01636664569377899, 0.017229512333869934, 0.018092380836606026, 0.018955249339342117, 0.01981811597943306, 0.020680982619524002, 0.021543851122260094, 0.022406719624996185, 0.023269586265087128, 0.02413245290517807, 0.02499532140791416, 0.025858189910650253, 0.026721056550741196, 0.027583923190832138, 0.02844679169356823, 0.02930966019630432, 0.030172526836395264]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0, 4.0, 1.0, 9.0, 9.0, 8.0, 8.0, 7.0, 24.0, 31.0, 34.0, 86.0, 102.0, 176.0, 285.0, 862.0, 4357.0, 43624.0, 3956158.0, 176826.0, 8067.0, 1951.0, 934.0, 430.0, 145.0, 72.0, 27.0, 19.0, 9.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0219879150390625, -0.021335124969482422, -0.020682334899902344, -0.020029544830322266, -0.019376754760742188, -0.01872396469116211, -0.01807117462158203, -0.017418384552001953, -0.016765594482421875, -0.016112804412841797, -0.015460014343261719, -0.01480722427368164, -0.014154434204101562, -0.013501644134521484, -0.012848854064941406, -0.012196063995361328, -0.01154327392578125, -0.010890483856201172, -0.010237693786621094, -0.009584903717041016, -0.008932113647460938, -0.00827932357788086, -0.007626533508300781, -0.006973743438720703, -0.006320953369140625, -0.005668163299560547, -0.005015373229980469, -0.004362583160400391, -0.0037097930908203125, -0.0030570030212402344, -0.0024042129516601562, -0.0017514228820800781, -0.0010986328125, -0.0004458427429199219, 0.00020694732666015625, 0.0008597373962402344, 0.0015125274658203125, 0.0021653175354003906, 0.0028181076049804688, 0.003470897674560547, 0.004123687744140625, 0.004776477813720703, 0.005429267883300781, 0.006082057952880859, 0.0067348480224609375, 0.007387638092041016, 0.008040428161621094, 0.008693218231201172, 0.00934600830078125, 0.009998798370361328, 0.010651588439941406, 0.011304378509521484, 0.011957168579101562, 0.01260995864868164, 0.013262748718261719, 0.013915538787841797, 0.014568328857421875, 0.015221118927001953, 0.01587390899658203, 0.01652669906616211, 0.017179489135742188, 0.017832279205322266, 0.018485069274902344, 0.019137859344482422, 0.0197906494140625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 10.0, 45.0, 159.0, 332.0, 285.0, 135.0, 36.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02215576171875, -0.021626949310302734, -0.02109813690185547, -0.020569324493408203, -0.020040512084960938, -0.019511699676513672, -0.018982887268066406, -0.01845407485961914, -0.017925262451171875, -0.01739645004272461, -0.016867637634277344, -0.016338825225830078, -0.015810012817382812, -0.015281200408935547, -0.014752388000488281, -0.014223575592041016, -0.01369476318359375, -0.013165950775146484, -0.012637138366699219, -0.012108325958251953, -0.011579513549804688, -0.011050701141357422, -0.010521888732910156, -0.00999307632446289, -0.009464263916015625, -0.00893545150756836, -0.008406639099121094, -0.007877826690673828, -0.0073490142822265625, -0.006820201873779297, -0.006291389465332031, -0.005762577056884766, -0.0052337646484375, -0.004704952239990234, -0.004176139831542969, -0.003647327423095703, -0.0031185150146484375, -0.002589702606201172, -0.0020608901977539062, -0.0015320777893066406, -0.001003265380859375, -0.0004744529724121094, 5.435943603515625e-05, 0.0005831718444824219, 0.0011119842529296875, 0.0016407966613769531, 0.0021696090698242188, 0.0026984214782714844, 0.00322723388671875, 0.0037560462951660156, 0.004284858703613281, 0.004813671112060547, 0.0053424835205078125, 0.005871295928955078, 0.006400108337402344, 0.006928920745849609, 0.007457733154296875, 0.00798654556274414, 0.008515357971191406, 0.009044170379638672, 0.009572982788085938, 0.010101795196533203, 0.010630607604980469, 0.011159420013427734, 0.011688232421875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 3.0, 2.0, 4.0, 9.0, 9.0, 6.0, 20.0, 20.0, 49.0, 71.0, 95.0, 158.0, 291.0, 480.0, 884.0, 1769.0, 4042.0, 12253.0, 51528.0, 451666.0, 3444934.0, 181988.0, 29738.0, 8200.0, 2989.0, 1324.0, 706.0, 404.0, 221.0, 153.0, 88.0, 51.0, 45.0, 21.0, 15.0, 9.0, 7.0, 3.0, 8.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0], "bins": [-0.0119476318359375, -0.011618733406066895, -0.011289834976196289, -0.010960936546325684, -0.010632038116455078, -0.010303139686584473, -0.009974241256713867, -0.009645342826843262, -0.009316444396972656, -0.00898754596710205, -0.008658647537231445, -0.00832974910736084, -0.008000850677490234, -0.007671952247619629, -0.0073430538177490234, -0.007014155387878418, -0.0066852569580078125, -0.006356358528137207, -0.0060274600982666016, -0.005698561668395996, -0.005369663238525391, -0.005040764808654785, -0.00471186637878418, -0.004382967948913574, -0.004054069519042969, -0.0037251710891723633, -0.003396272659301758, -0.0030673742294311523, -0.002738475799560547, -0.0024095773696899414, -0.002080678939819336, -0.0017517805099487305, -0.001422882080078125, -0.0010939836502075195, -0.0007650852203369141, -0.0004361867904663086, -0.00010728836059570312, 0.00022161006927490234, 0.0005505084991455078, 0.0008794069290161133, 0.0012083053588867188, 0.0015372037887573242, 0.0018661022186279297, 0.002195000648498535, 0.0025238990783691406, 0.002852797508239746, 0.0031816959381103516, 0.003510594367980957, 0.0038394927978515625, 0.004168391227722168, 0.0044972896575927734, 0.004826188087463379, 0.005155086517333984, 0.00548398494720459, 0.005812883377075195, 0.006141781806945801, 0.006470680236816406, 0.006799578666687012, 0.007128477096557617, 0.007457375526428223, 0.007786273956298828, 0.008115172386169434, 0.008444070816040039, 0.008772969245910645, 0.00910186767578125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 3.0, 4.0, 7.0, 5.0, 14.0, 24.0, 31.0, 30.0, 50.0, 83.0, 180.0, 462.0, 1265.0, 1046.0, 387.0, 185.0, 102.0, 63.0, 41.0, 25.0, 24.0, 9.0, 11.0, 8.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0100250244140625, -0.00971066951751709, -0.00939631462097168, -0.00908195972442627, -0.00876760482788086, -0.00845324993133545, -0.008138895034790039, -0.007824540138244629, -0.007510185241699219, -0.007195830345153809, -0.0068814754486083984, -0.006567120552062988, -0.006252765655517578, -0.005938410758972168, -0.005624055862426758, -0.005309700965881348, -0.0049953460693359375, -0.004680991172790527, -0.004366636276245117, -0.004052281379699707, -0.003737926483154297, -0.0034235715866088867, -0.0031092166900634766, -0.0027948617935180664, -0.0024805068969726562, -0.002166152000427246, -0.001851797103881836, -0.0015374422073364258, -0.0012230873107910156, -0.0009087324142456055, -0.0005943775177001953, -0.00028002262115478516, 3.4332275390625e-05, 0.00034868717193603516, 0.0006630420684814453, 0.0009773969650268555, 0.0012917518615722656, 0.0016061067581176758, 0.001920461654663086, 0.002234816551208496, 0.0025491714477539062, 0.0028635263442993164, 0.0031778812408447266, 0.0034922361373901367, 0.003806591033935547, 0.004120945930480957, 0.004435300827026367, 0.004749655723571777, 0.0050640106201171875, 0.005378365516662598, 0.005692720413208008, 0.006007075309753418, 0.006321430206298828, 0.006635785102844238, 0.0069501399993896484, 0.007264494895935059, 0.007578849792480469, 0.007893204689025879, 0.008207559585571289, 0.0085219144821167, 0.00883626937866211, 0.00915062427520752, 0.00946497917175293, 0.00977933406829834, 0.01009368896484375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 1.0, 15.0, 20.0, 44.0, 71.0, 149.0, 197.0, 180.0, 140.0, 75.0, 37.0, 22.0, 19.0, 7.0, 6.0, 3.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06299081444740295, -0.06119625270366669, -0.05940169095993042, -0.057607125490903854, -0.05581256374716759, -0.05401800200343132, -0.05222344025969505, -0.05042887479066849, -0.04863431304693222, -0.04683975130319595, -0.045045189559459686, -0.04325062409043312, -0.041456062346696854, -0.03966150060296059, -0.03786693885922432, -0.036072373390197754, -0.03427781164646149, -0.03248324990272522, -0.030688686296343803, -0.028894124552607536, -0.02709956094622612, -0.025304999202489853, -0.023510437458753586, -0.02171587385237217, -0.01992131397128105, -0.018126752227544785, -0.016332188621163368, -0.014537626877427101, -0.012743063271045685, -0.010948501527309418, -0.009153938852250576, -0.007359376177191734, -0.005564812570810318, -0.0037702498957514763, -0.0019756874535232782, -0.00018112501129508018, 0.0016134376637637615, 0.003407999873161316, 0.005202562548220158, 0.006997125223278999, 0.008791687898337841, 0.010586250573396683, 0.012380813248455524, 0.014175375923514366, 0.015969937667250633, 0.01776450127363205, 0.019559063017368317, 0.021353624761104584, 0.023148188367486, 0.024942750111222267, 0.026737313717603683, 0.02853187546133995, 0.030326439067721367, 0.03212100267410278, 0.03391556441783905, 0.03571012616157532, 0.037504687905311584, 0.03929924964904785, 0.04109381139278412, 0.042888376861810684, 0.04468293860554695, 0.04647750034928322, 0.048272062093019485, 0.05006662756204605, 0.05186118930578232]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 4.0, 9.0, 12.0, 15.0, 17.0, 16.0, 18.0, 21.0, 27.0, 35.0, 30.0, 35.0, 51.0, 53.0, 50.0, 49.0, 45.0, 55.0, 51.0, 49.0, 51.0, 49.0, 35.0, 41.0, 26.0, 28.0, 29.0, 25.0, 18.0, 16.0, 8.0, 7.0, 4.0, 6.0, 5.0, 2.0, 6.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.028220653533935547, -0.027442384511232376, -0.026664113625884056, -0.025885842740535736, -0.025107573717832565, -0.024329304695129395, -0.023551033809781075, -0.022772762924432755, -0.021994493901729584, -0.021216224879026413, -0.020437953993678093, -0.019659683108329773, -0.018881414085626602, -0.01810314506292343, -0.01732487417757511, -0.01654660329222679, -0.01576833426952362, -0.014990064315497875, -0.01421179436147213, -0.013433524407446384, -0.012655254453420639, -0.011876984499394894, -0.011098714545369148, -0.010320444591343403, -0.009542174637317657, -0.008763904683291912, -0.007985634729266167, -0.007207364775240421, -0.006429094821214676, -0.0056508248671889305, -0.004872554913163185, -0.00409428495913744, -0.0033160150051116943, -0.002537745051085949, -0.0017594750970602036, -0.0009812051430344582, -0.00020293518900871277, 0.0005753347650170326, 0.001353604719042778, 0.0021318746730685234, 0.002910144627094269, 0.003688414581120014, 0.00446668453514576, 0.005244954489171505, 0.00602322444319725, 0.006801494397222996, 0.007579764351248741, 0.008358034305274487, 0.009136304259300232, 0.009914574213325977, 0.010692844167351723, 0.011471114121377468, 0.012249384075403214, 0.013027654029428959, 0.013805923983454704, 0.01458419393748045, 0.015362463891506195, 0.016140732914209366, 0.016919003799557686, 0.017697274684906006, 0.018475543707609177, 0.019253812730312347, 0.020032083615660667, 0.020810354501008987, 0.021588623523712158]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 8.0, 7.0, 6.0, 11.0, 12.0, 15.0, 17.0, 18.0, 27.0, 28.0, 47.0, 77.0, 98.0, 136.0, 197.0, 277.0, 450.0, 750.0, 1661.0, 5820.0, 63536.0, 812540.0, 148784.0, 9276.0, 2201.0, 952.0, 503.0, 357.0, 206.0, 148.0, 94.0, 90.0, 45.0, 39.0, 30.0, 13.0, 14.0, 15.0, 7.0, 10.0, 7.0, 8.0, 5.0, 1.0, 5.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0323486328125, -0.03129243850708008, -0.030236244201660156, -0.029180049896240234, -0.028123855590820312, -0.02706766128540039, -0.02601146697998047, -0.024955272674560547, -0.023899078369140625, -0.022842884063720703, -0.02178668975830078, -0.02073049545288086, -0.019674301147460938, -0.018618106842041016, -0.017561912536621094, -0.016505718231201172, -0.01544952392578125, -0.014393329620361328, -0.013337135314941406, -0.012280941009521484, -0.011224746704101562, -0.01016855239868164, -0.009112358093261719, -0.008056163787841797, -0.006999969482421875, -0.005943775177001953, -0.004887580871582031, -0.0038313865661621094, -0.0027751922607421875, -0.0017189979553222656, -0.0006628036499023438, 0.0003933906555175781, 0.0014495849609375, 0.002505779266357422, 0.0035619735717773438, 0.004618167877197266, 0.0056743621826171875, 0.006730556488037109, 0.007786750793457031, 0.008842945098876953, 0.009899139404296875, 0.010955333709716797, 0.012011528015136719, 0.01306772232055664, 0.014123916625976562, 0.015180110931396484, 0.016236305236816406, 0.017292499542236328, 0.01834869384765625, 0.019404888153076172, 0.020461082458496094, 0.021517276763916016, 0.022573471069335938, 0.02362966537475586, 0.02468585968017578, 0.025742053985595703, 0.026798248291015625, 0.027854442596435547, 0.02891063690185547, 0.02996683120727539, 0.031023025512695312, 0.032079219818115234, 0.033135414123535156, 0.03419160842895508, 0.035247802734375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 18.0, 113.0, 273.0, 308.0, 208.0, 70.0, 9.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.022979736328125, -0.02243649959564209, -0.02189326286315918, -0.02135002613067627, -0.02080678939819336, -0.02026355266571045, -0.01972031593322754, -0.01917707920074463, -0.01863384246826172, -0.01809060573577881, -0.0175473690032959, -0.01700413227081299, -0.016460895538330078, -0.015917658805847168, -0.015374422073364258, -0.014831185340881348, -0.014287948608398438, -0.013744711875915527, -0.013201475143432617, -0.012658238410949707, -0.012115001678466797, -0.011571764945983887, -0.011028528213500977, -0.010485291481018066, -0.009942054748535156, -0.009398818016052246, -0.008855581283569336, -0.008312344551086426, -0.007769107818603516, -0.0072258710861206055, -0.006682634353637695, -0.006139397621154785, -0.005596160888671875, -0.005052924156188965, -0.004509687423706055, -0.0039664506912231445, -0.0034232139587402344, -0.0028799772262573242, -0.002336740493774414, -0.001793503761291504, -0.0012502670288085938, -0.0007070302963256836, -0.00016379356384277344, 0.0003794431686401367, 0.0009226799011230469, 0.001465916633605957, 0.002009153366088867, 0.0025523900985717773, 0.0030956268310546875, 0.0036388635635375977, 0.004182100296020508, 0.004725337028503418, 0.005268573760986328, 0.005811810493469238, 0.0063550472259521484, 0.006898283958435059, 0.007441520690917969, 0.007984757423400879, 0.008527994155883789, 0.0090712308883667, 0.00961446762084961, 0.01015770435333252, 0.01070094108581543, 0.01124417781829834, 0.01178741455078125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 7.0, 5.0, 8.0, 21.0, 26.0, 25.0, 38.0, 47.0, 60.0, 118.0, 194.0, 267.0, 443.0, 618.0, 1023.0, 1704.0, 2938.0, 5420.0, 10379.0, 21567.0, 47678.0, 108700.0, 230980.0, 295454.0, 174197.0, 78347.0, 34010.0, 15982.0, 7940.0, 4178.0, 2360.0, 1405.0, 797.0, 563.0, 353.0, 206.0, 168.0, 103.0, 64.0, 47.0, 37.0, 21.0, 22.0, 12.0, 6.0, 4.0, 5.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.00798797607421875, -0.007732748985290527, -0.007477521896362305, -0.007222294807434082, -0.006967067718505859, -0.006711840629577637, -0.006456613540649414, -0.006201386451721191, -0.005946159362792969, -0.005690932273864746, -0.0054357051849365234, -0.005180478096008301, -0.004925251007080078, -0.0046700239181518555, -0.004414796829223633, -0.00415956974029541, -0.0039043426513671875, -0.003649115562438965, -0.003393888473510742, -0.0031386613845825195, -0.002883434295654297, -0.0026282072067260742, -0.0023729801177978516, -0.002117753028869629, -0.0018625259399414062, -0.0016072988510131836, -0.001352071762084961, -0.0010968446731567383, -0.0008416175842285156, -0.000586390495300293, -0.0003311634063720703, -7.593631744384766e-05, 0.000179290771484375, 0.00043451786041259766, 0.0006897449493408203, 0.000944972038269043, 0.0012001991271972656, 0.0014554262161254883, 0.001710653305053711, 0.0019658803939819336, 0.0022211074829101562, 0.002476334571838379, 0.0027315616607666016, 0.0029867887496948242, 0.003242015838623047, 0.0034972429275512695, 0.003752470016479492, 0.004007697105407715, 0.0042629241943359375, 0.00451815128326416, 0.004773378372192383, 0.0050286054611206055, 0.005283832550048828, 0.005539059638977051, 0.0057942867279052734, 0.006049513816833496, 0.006304740905761719, 0.006559967994689941, 0.006815195083618164, 0.007070422172546387, 0.007325649261474609, 0.007580876350402832, 0.007836103439331055, 0.008091330528259277, 0.0083465576171875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 4.0, 2.0, 4.0, 6.0, 8.0, 8.0, 17.0, 13.0, 9.0, 29.0, 21.0, 35.0, 39.0, 58.0, 44.0, 42.0, 55.0, 57.0, 66.0, 65.0, 61.0, 50.0, 39.0, 46.0, 39.0, 39.0, 30.0, 21.0, 17.0, 21.0, 11.0, 8.0, 13.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0119171142578125, -0.011530041694641113, -0.011142969131469727, -0.01075589656829834, -0.010368824005126953, -0.009981751441955566, -0.00959467887878418, -0.009207606315612793, -0.008820533752441406, -0.00843346118927002, -0.008046388626098633, -0.007659316062927246, -0.007272243499755859, -0.006885170936584473, -0.006498098373413086, -0.006111025810241699, -0.0057239532470703125, -0.005336880683898926, -0.004949808120727539, -0.004562735557556152, -0.004175662994384766, -0.003788590431213379, -0.003401517868041992, -0.0030144453048706055, -0.0026273727416992188, -0.002240300178527832, -0.0018532276153564453, -0.0014661550521850586, -0.0010790824890136719, -0.0006920099258422852, -0.00030493736267089844, 8.213520050048828e-05, 0.000469207763671875, 0.0008562803268432617, 0.0012433528900146484, 0.0016304254531860352, 0.002017498016357422, 0.0024045705795288086, 0.0027916431427001953, 0.003178715705871582, 0.0035657882690429688, 0.0039528608322143555, 0.004339933395385742, 0.004727005958557129, 0.005114078521728516, 0.005501151084899902, 0.005888223648071289, 0.006275296211242676, 0.0066623687744140625, 0.007049441337585449, 0.007436513900756836, 0.007823586463928223, 0.00821065902709961, 0.008597731590270996, 0.008984804153442383, 0.00937187671661377, 0.009758949279785156, 0.010146021842956543, 0.01053309440612793, 0.010920166969299316, 0.011307239532470703, 0.01169431209564209, 0.012081384658813477, 0.012468457221984863, 0.01285552978515625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 7.0, 5.0, 12.0, 15.0, 14.0, 19.0, 27.0, 51.0, 56.0, 81.0, 96.0, 115.0, 191.0, 227.0, 328.0, 441.0, 663.0, 919.0, 1299.0, 1998.0, 3042.0, 5177.0, 10534.0, 24756.0, 71072.0, 233159.0, 426462.0, 172987.0, 53495.0, 19430.0, 8674.0, 4576.0, 2752.0, 1725.0, 1191.0, 790.0, 573.0, 407.0, 302.0, 243.0, 169.0, 130.0, 89.0, 63.0, 48.0, 44.0, 27.0, 22.0, 11.0, 9.0, 10.0, 4.0, 8.0, 6.0, 4.0, 0.0, 5.0, 2.0, 0.0, 1.0], "bins": [-0.004878997802734375, -0.004718363285064697, -0.0045577287673950195, -0.004397094249725342, -0.004236459732055664, -0.004075825214385986, -0.003915190696716309, -0.003754556179046631, -0.003593921661376953, -0.0034332871437072754, -0.0032726526260375977, -0.00311201810836792, -0.002951383590698242, -0.0027907490730285645, -0.0026301145553588867, -0.002469480037689209, -0.0023088455200195312, -0.0021482110023498535, -0.0019875764846801758, -0.001826941967010498, -0.0016663074493408203, -0.0015056729316711426, -0.0013450384140014648, -0.0011844038963317871, -0.0010237693786621094, -0.0008631348609924316, -0.0007025003433227539, -0.0005418658256530762, -0.00038123130798339844, -0.0002205967903137207, -5.996227264404297e-05, 0.00010067224502563477, 0.0002613067626953125, 0.00042194128036499023, 0.000582575798034668, 0.0007432103157043457, 0.0009038448333740234, 0.0010644793510437012, 0.001225113868713379, 0.0013857483863830566, 0.0015463829040527344, 0.0017070174217224121, 0.0018676519393920898, 0.0020282864570617676, 0.0021889209747314453, 0.002349555492401123, 0.0025101900100708008, 0.0026708245277404785, 0.0028314590454101562, 0.002992093563079834, 0.0031527280807495117, 0.0033133625984191895, 0.003473997116088867, 0.003634631633758545, 0.0037952661514282227, 0.0039559006690979, 0.004116535186767578, 0.004277169704437256, 0.004437804222106934, 0.004598438739776611, 0.004759073257446289, 0.004919707775115967, 0.0050803422927856445, 0.005240976810455322, 0.005401611328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 7.0, 2.0, 3.0, 6.0, 6.0, 13.0, 9.0, 7.0, 17.0, 22.0, 22.0, 33.0, 28.0, 40.0, 56.0, 61.0, 80.0, 70.0, 95.0, 86.0, 66.0, 44.0, 43.0, 31.0, 27.0, 25.0, 20.0, 12.0, 12.0, 5.0, 6.0, 7.0, 8.0, 0.0, 4.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.778406143188477e-05, -7.53672793507576e-05, -7.295049726963043e-05, -7.053371518850327e-05, -6.81169331073761e-05, -6.570015102624893e-05, -6.328336894512177e-05, -6.08665868639946e-05, -5.844980478286743e-05, -5.6033022701740265e-05, -5.36162406206131e-05, -5.119945853948593e-05, -4.8782676458358765e-05, -4.63658943772316e-05, -4.394911229610443e-05, -4.1532330214977264e-05, -3.91155481338501e-05, -3.669876605272293e-05, -3.4281983971595764e-05, -3.18652018904686e-05, -2.944841980934143e-05, -2.7031637728214264e-05, -2.4614855647087097e-05, -2.219807356595993e-05, -1.9781291484832764e-05, -1.7364509403705597e-05, -1.494772732257843e-05, -1.2530945241451263e-05, -1.0114163160324097e-05, -7.69738107919693e-06, -5.280598998069763e-06, -2.8638169169425964e-06, -4.470348358154297e-07, 1.969747245311737e-06, 4.386529326438904e-06, 6.8033114075660706e-06, 9.220093488693237e-06, 1.1636875569820404e-05, 1.405365765094757e-05, 1.6470439732074738e-05, 1.8887221813201904e-05, 2.130400389432907e-05, 2.3720785975456238e-05, 2.6137568056583405e-05, 2.855435013771057e-05, 3.097113221883774e-05, 3.3387914299964905e-05, 3.580469638109207e-05, 3.822147846221924e-05, 4.0638260543346405e-05, 4.305504262447357e-05, 4.547182470560074e-05, 4.7888606786727905e-05, 5.030538886785507e-05, 5.272217094898224e-05, 5.5138953030109406e-05, 5.755573511123657e-05, 5.997251719236374e-05, 6.23892992734909e-05, 6.480608135461807e-05, 6.722286343574524e-05, 6.96396455168724e-05, 7.205642759799957e-05, 7.447320967912674e-05, 7.68899917602539e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 6.0, 7.0, 6.0, 12.0, 24.0, 39.0, 47.0, 69.0, 89.0, 135.0, 206.0, 329.0, 536.0, 844.0, 1418.0, 2640.0, 5600.0, 14818.0, 57528.0, 347743.0, 497471.0, 84663.0, 20001.0, 7050.0, 3056.0, 1621.0, 914.0, 574.0, 335.0, 262.0, 162.0, 110.0, 84.0, 46.0, 23.0, 19.0, 26.0, 12.0, 9.0, 8.0, 4.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00800323486328125, -0.007737517356872559, -0.007471799850463867, -0.007206082344055176, -0.006940364837646484, -0.006674647331237793, -0.0064089298248291016, -0.00614321231842041, -0.005877494812011719, -0.005611777305603027, -0.005346059799194336, -0.0050803422927856445, -0.004814624786376953, -0.004548907279968262, -0.00428318977355957, -0.004017472267150879, -0.0037517547607421875, -0.003486037254333496, -0.0032203197479248047, -0.0029546022415161133, -0.002688884735107422, -0.0024231672286987305, -0.002157449722290039, -0.0018917322158813477, -0.0016260147094726562, -0.0013602972030639648, -0.0010945796966552734, -0.000828862190246582, -0.0005631446838378906, -0.0002974271774291992, -3.170967102050781e-05, 0.0002340078353881836, 0.000499725341796875, 0.0007654428482055664, 0.0010311603546142578, 0.0012968778610229492, 0.0015625953674316406, 0.001828312873840332, 0.0020940303802490234, 0.002359747886657715, 0.0026254653930664062, 0.0028911828994750977, 0.003156900405883789, 0.0034226179122924805, 0.003688335418701172, 0.003954052925109863, 0.004219770431518555, 0.004485487937927246, 0.0047512054443359375, 0.005016922950744629, 0.00528264045715332, 0.005548357963562012, 0.005814075469970703, 0.0060797929763793945, 0.006345510482788086, 0.006611227989196777, 0.006876945495605469, 0.00714266300201416, 0.0074083805084228516, 0.007674098014831543, 0.007939815521240234, 0.008205533027648926, 0.008471250534057617, 0.008736968040466309, 0.009002685546875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 1.0, 4.0, 4.0, 14.0, 13.0, 17.0, 37.0, 61.0, 107.0, 163.0, 167.0, 153.0, 103.0, 65.0, 33.0, 26.0, 7.0, 8.0, 4.0, 0.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.0102081298828125, -0.00989377498626709, -0.00957942008972168, -0.00926506519317627, -0.00895071029663086, -0.00863635540008545, -0.008322000503540039, -0.008007645606994629, -0.007693290710449219, -0.007378935813903809, -0.0070645809173583984, -0.006750226020812988, -0.006435871124267578, -0.006121516227722168, -0.005807161331176758, -0.005492806434631348, -0.0051784515380859375, -0.004864096641540527, -0.004549741744995117, -0.004235386848449707, -0.003921031951904297, -0.0036066770553588867, -0.0032923221588134766, -0.0029779672622680664, -0.0026636123657226562, -0.002349257469177246, -0.002034902572631836, -0.0017205476760864258, -0.0014061927795410156, -0.0010918378829956055, -0.0007774829864501953, -0.00046312808990478516, -0.000148773193359375, 0.00016558170318603516, 0.0004799365997314453, 0.0007942914962768555, 0.0011086463928222656, 0.0014230012893676758, 0.001737356185913086, 0.002051711082458496, 0.0023660659790039062, 0.0026804208755493164, 0.0029947757720947266, 0.0033091306686401367, 0.003623485565185547, 0.003937840461730957, 0.004252195358276367, 0.004566550254821777, 0.0048809051513671875, 0.005195260047912598, 0.005509614944458008, 0.005823969841003418, 0.006138324737548828, 0.006452679634094238, 0.0067670345306396484, 0.007081389427185059, 0.007395744323730469, 0.007710099220275879, 0.008024454116821289, 0.0083388090133667, 0.00865316390991211, 0.00896751880645752, 0.00928187370300293, 0.00959622859954834, 0.00991058349609375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 11.0, 14.0, 21.0, 42.0, 82.0, 104.0, 187.0, 200.0, 149.0, 96.0, 54.0, 22.0, 12.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1482071429491043, -0.1450713872909546, -0.14193564653396606, -0.13879989087581635, -0.13566413521766663, -0.1325283944606781, -0.12939263880252838, -0.12625688314437866, -0.12312113493680954, -0.11998538672924042, -0.1168496310710907, -0.11371388286352158, -0.11057812720537186, -0.10744237899780273, -0.10430662333965302, -0.10117087513208389, -0.09803512692451477, -0.09489937871694565, -0.09176362305879593, -0.0886278748512268, -0.08549211919307709, -0.08235637098550797, -0.07922062277793884, -0.07608486711978912, -0.0729491114616394, -0.06981336325407028, -0.06667760759592056, -0.06354185938835144, -0.06040610745549202, -0.0572703555226326, -0.05413460358977318, -0.05099885165691376, -0.047863103449344635, -0.044727351516485214, -0.04159159958362579, -0.03845585137605667, -0.03532009944319725, -0.03218434751033783, -0.02904859557747841, -0.025912845507264137, -0.022777093574404716, -0.019641341641545296, -0.016505591571331024, -0.013369839638471603, -0.010234088636934757, -0.007098337635397911, -0.00396258570253849, -0.0008268356323242188, 0.002308916300535202, 0.005444667302072048, 0.008580418303608894, 0.011716170236468315, 0.014851921238005161, 0.017987672239542007, 0.021123424172401428, 0.0242591742426157, 0.02739492617547512, 0.03053067810833454, 0.03366642817854881, 0.036802180111408234, 0.039937932044267654, 0.043073683977127075, 0.0462094321846962, 0.04934518411755562, 0.05248093605041504]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 7.0, 9.0, 10.0, 12.0, 8.0, 7.0, 22.0, 20.0, 22.0, 25.0, 22.0, 29.0, 27.0, 34.0, 45.0, 29.0, 50.0, 52.0, 40.0, 38.0, 36.0, 45.0, 49.0, 40.0, 44.0, 31.0, 32.0, 22.0, 27.0, 29.0, 21.0, 23.0, 14.0, 23.0, 7.0, 12.0, 9.0, 13.0, 6.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028327584266662598, -0.02739134430885315, -0.02645510621368885, -0.02551886811852455, -0.024582628160715103, -0.023646388202905655, -0.022710150107741356, -0.021773912012577057, -0.02083767205476761, -0.01990143209695816, -0.01896519400179386, -0.018028955906629562, -0.017092715948820114, -0.016156475991010666, -0.015220237895846367, -0.014283998869359493, -0.01334775984287262, -0.012411520816385746, -0.011475281789898872, -0.010539042763411999, -0.009602803736925125, -0.008666564710438251, -0.007730325683951378, -0.006794086657464504, -0.005857847630977631, -0.004921608604490757, -0.003985369578003883, -0.0030491305515170097, -0.002112891525030136, -0.0011766524985432625, -0.00024041347205638885, 0.0006958255544304848, 0.0016320645809173584, 0.002568303607404232, 0.0035045426338911057, 0.004440781660377979, 0.005377020686864853, 0.0063132597133517265, 0.0072494987398386, 0.008185737766325474, 0.009121976792812347, 0.010058215819299221, 0.010994454845786095, 0.011930693872272968, 0.012866932898759842, 0.013803171925246716, 0.01473941095173359, 0.015675649046897888, 0.016611889004707336, 0.017548128962516785, 0.018484367057681084, 0.019420605152845383, 0.02035684511065483, 0.02129308506846428, 0.022229323163628578, 0.023165561258792877, 0.024101801216602325, 0.025038041174411774, 0.025974279269576073, 0.02691051736474037, 0.02784675732254982, 0.028782997280359268, 0.029719235375523567, 0.030655473470687866, 0.031591713428497314]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 7.0, 6.0, 12.0, 14.0, 12.0, 19.0, 38.0, 52.0, 66.0, 147.0, 318.0, 1097.0, 6943.0, 96669.0, 4021338.0, 59332.0, 5600.0, 1532.0, 647.0, 229.0, 67.0, 39.0, 26.0, 20.0, 15.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0249176025390625, -0.024214506149291992, -0.023511409759521484, -0.022808313369750977, -0.02210521697998047, -0.02140212059020996, -0.020699024200439453, -0.019995927810668945, -0.019292831420898438, -0.01858973503112793, -0.017886638641357422, -0.017183542251586914, -0.016480445861816406, -0.0157773494720459, -0.01507425308227539, -0.014371156692504883, -0.013668060302734375, -0.012964963912963867, -0.01226186752319336, -0.011558771133422852, -0.010855674743652344, -0.010152578353881836, -0.009449481964111328, -0.00874638557434082, -0.008043289184570312, -0.007340192794799805, -0.006637096405029297, -0.005934000015258789, -0.005230903625488281, -0.0045278072357177734, -0.0038247108459472656, -0.003121614456176758, -0.00241851806640625, -0.0017154216766357422, -0.0010123252868652344, -0.00030922889709472656, 0.00039386749267578125, 0.001096963882446289, 0.0018000602722167969, 0.0025031566619873047, 0.0032062530517578125, 0.00390934944152832, 0.004612445831298828, 0.005315542221069336, 0.006018638610839844, 0.0067217350006103516, 0.007424831390380859, 0.008127927780151367, 0.008831024169921875, 0.009534120559692383, 0.01023721694946289, 0.010940313339233398, 0.011643409729003906, 0.012346506118774414, 0.013049602508544922, 0.01375269889831543, 0.014455795288085938, 0.015158891677856445, 0.015861988067626953, 0.01656508445739746, 0.01726818084716797, 0.017971277236938477, 0.018674373626708984, 0.019377470016479492, 0.02008056640625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 100.0, 205.0, 296.0, 249.0, 106.0, 31.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022430419921875, -0.021891355514526367, -0.021352291107177734, -0.0208132266998291, -0.02027416229248047, -0.019735097885131836, -0.019196033477783203, -0.01865696907043457, -0.018117904663085938, -0.017578840255737305, -0.017039775848388672, -0.01650071144104004, -0.015961647033691406, -0.015422582626342773, -0.01488351821899414, -0.014344453811645508, -0.013805389404296875, -0.013266324996948242, -0.01272726058959961, -0.012188196182250977, -0.011649131774902344, -0.011110067367553711, -0.010571002960205078, -0.010031938552856445, -0.009492874145507812, -0.00895380973815918, -0.008414745330810547, -0.007875680923461914, -0.007336616516113281, -0.0067975521087646484, -0.006258487701416016, -0.005719423294067383, -0.00518035888671875, -0.004641294479370117, -0.004102230072021484, -0.0035631656646728516, -0.0030241012573242188, -0.002485036849975586, -0.0019459724426269531, -0.0014069080352783203, -0.0008678436279296875, -0.0003287792205810547, 0.00021028518676757812, 0.0007493495941162109, 0.0012884140014648438, 0.0018274784088134766, 0.0023665428161621094, 0.002905607223510742, 0.003444671630859375, 0.003983736038208008, 0.004522800445556641, 0.0050618648529052734, 0.005600929260253906, 0.006139993667602539, 0.006679058074951172, 0.007218122482299805, 0.0077571868896484375, 0.00829625129699707, 0.008835315704345703, 0.009374380111694336, 0.009913444519042969, 0.010452508926391602, 0.010991573333740234, 0.011530637741088867, 0.0120697021484375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 5.0, 9.0, 11.0, 14.0, 23.0, 26.0, 32.0, 54.0, 95.0, 137.0, 248.0, 468.0, 770.0, 1441.0, 2957.0, 6881.0, 20679.0, 84249.0, 994970.0, 2895058.0, 139707.0, 29373.0, 9274.0, 3796.0, 1760.0, 895.0, 519.0, 310.0, 172.0, 120.0, 62.0, 50.0, 29.0, 21.0, 15.0, 16.0, 6.0, 10.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.00958251953125, -0.009284377098083496, -0.008986234664916992, -0.008688092231750488, -0.008389949798583984, -0.00809180736541748, -0.0077936649322509766, -0.007495522499084473, -0.007197380065917969, -0.006899237632751465, -0.006601095199584961, -0.006302952766418457, -0.006004810333251953, -0.005706667900085449, -0.005408525466918945, -0.005110383033752441, -0.0048122406005859375, -0.004514098167419434, -0.00421595573425293, -0.003917813301086426, -0.003619670867919922, -0.003321528434753418, -0.003023386001586914, -0.00272524356842041, -0.0024271011352539062, -0.0021289587020874023, -0.0018308162689208984, -0.0015326738357543945, -0.0012345314025878906, -0.0009363889694213867, -0.0006382465362548828, -0.0003401041030883789, -4.1961669921875e-05, 0.0002561807632446289, 0.0005543231964111328, 0.0008524656295776367, 0.0011506080627441406, 0.0014487504959106445, 0.0017468929290771484, 0.0020450353622436523, 0.0023431777954101562, 0.00264132022857666, 0.002939462661743164, 0.003237605094909668, 0.003535747528076172, 0.0038338899612426758, 0.00413203239440918, 0.004430174827575684, 0.0047283172607421875, 0.005026459693908691, 0.005324602127075195, 0.005622744560241699, 0.005920886993408203, 0.006219029426574707, 0.006517171859741211, 0.006815314292907715, 0.007113456726074219, 0.007411599159240723, 0.0077097415924072266, 0.00800788402557373, 0.008306026458740234, 0.008604168891906738, 0.008902311325073242, 0.009200453758239746, 0.00949859619140625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 7.0, 1.0, 12.0, 19.0, 23.0, 40.0, 52.0, 81.0, 133.0, 298.0, 851.0, 1383.0, 578.0, 233.0, 133.0, 78.0, 41.0, 29.0, 18.0, 10.0, 14.0, 5.0, 7.0, 8.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01031494140625, -0.010022759437561035, -0.00973057746887207, -0.009438395500183105, -0.00914621353149414, -0.008854031562805176, -0.008561849594116211, -0.008269667625427246, -0.007977485656738281, -0.007685303688049316, -0.0073931217193603516, -0.007100939750671387, -0.006808757781982422, -0.006516575813293457, -0.006224393844604492, -0.005932211875915527, -0.0056400299072265625, -0.005347847938537598, -0.005055665969848633, -0.004763484001159668, -0.004471302032470703, -0.004179120063781738, -0.0038869380950927734, -0.0035947561264038086, -0.0033025741577148438, -0.003010392189025879, -0.002718210220336914, -0.0024260282516479492, -0.0021338462829589844, -0.0018416643142700195, -0.0015494823455810547, -0.0012573003768920898, -0.000965118408203125, -0.0006729364395141602, -0.0003807544708251953, -8.857250213623047e-05, 0.00020360946655273438, 0.0004957914352416992, 0.0007879734039306641, 0.001080155372619629, 0.0013723373413085938, 0.0016645193099975586, 0.0019567012786865234, 0.0022488832473754883, 0.002541065216064453, 0.002833247184753418, 0.003125429153442383, 0.0034176111221313477, 0.0037097930908203125, 0.004001975059509277, 0.004294157028198242, 0.004586338996887207, 0.004878520965576172, 0.005170702934265137, 0.0054628849029541016, 0.005755066871643066, 0.006047248840332031, 0.006339430809020996, 0.006631612777709961, 0.006923794746398926, 0.007215976715087891, 0.0075081586837768555, 0.00780034065246582, 0.008092522621154785, 0.00838470458984375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 12.0, 39.0, 168.0, 374.0, 297.0, 89.0, 17.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09204760938882828, -0.08801400661468506, -0.08398040384054184, -0.07994680106639862, -0.0759131908416748, -0.07187958806753159, -0.06784598529338837, -0.06381238251924515, -0.05977877601981163, -0.05574517324566841, -0.051711566746234894, -0.047677963972091675, -0.043644361197948456, -0.03961075469851494, -0.03557715192437172, -0.0315435454249382, -0.027509942650794983, -0.023476338014006615, -0.019442733377218246, -0.015409130603075027, -0.01137552596628666, -0.007341921329498291, -0.003308318555355072, 0.0007252860814332962, 0.004758890718221664, 0.008792495355010033, 0.012826099060475826, 0.01685970276594162, 0.020893307402729988, 0.024926912039518356, 0.028960514813661575, 0.03299412131309509, 0.03702773153781891, 0.04106133431196213, 0.045094940811395645, 0.049128543585538864, 0.05316215008497238, 0.0571957528591156, 0.06122935563325882, 0.06526295840740204, 0.06929656863212585, 0.07333017140626907, 0.07736377418041229, 0.08139738440513611, 0.08543098717927933, 0.08946458995342255, 0.09349819272756577, 0.09753179550170898, 0.1015653982758522, 0.10559900104999542, 0.10963260382413864, 0.11366620659828186, 0.11769981682300568, 0.1217334195971489, 0.12576702237129211, 0.12980063259601593, 0.13383422791957855, 0.13786783814430237, 0.141901433467865, 0.1459350436925888, 0.14996863901615143, 0.15400224924087524, 0.15803584456443787, 0.16206945478916168, 0.1661030650138855]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 8.0, 12.0, 9.0, 11.0, 18.0, 21.0, 34.0, 38.0, 39.0, 39.0, 57.0, 67.0, 68.0, 65.0, 66.0, 60.0, 61.0, 59.0, 46.0, 38.0, 45.0, 39.0, 22.0, 22.0, 15.0, 13.0, 12.0, 7.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030533015727996826, -0.02957664057612419, -0.028620265424251556, -0.02766389027237892, -0.026707515120506287, -0.02575113996863365, -0.024794764816761017, -0.023838389664888382, -0.022882014513015747, -0.021925639361143112, -0.020969264209270477, -0.020012889057397842, -0.019056513905525208, -0.018100138753652573, -0.017143763601779938, -0.016187388449907303, -0.015231013298034668, -0.014274638146162033, -0.013318262994289398, -0.012361887842416763, -0.011405512690544128, -0.010449137538671494, -0.009492762386798859, -0.008536387234926224, -0.007580012083053589, -0.006623636931180954, -0.005667261779308319, -0.004710886627435684, -0.0037545114755630493, -0.0027981363236904144, -0.0018417611718177795, -0.0008853860199451447, 7.098913192749023e-05, 0.0010273642838001251, 0.00198373943567276, 0.002940114587545395, 0.00389648973941803, 0.004852864891290665, 0.0058092400431632996, 0.0067656151950359344, 0.007721990346908569, 0.008678365498781204, 0.009634740650653839, 0.010591115802526474, 0.011547490954399109, 0.012503866106271744, 0.013460241258144379, 0.014416616410017014, 0.015372991561889648, 0.016329366713762283, 0.017285741865634918, 0.018242117017507553, 0.019198492169380188, 0.020154867321252823, 0.021111242473125458, 0.022067617624998093, 0.023023992776870728, 0.023980367928743362, 0.024936743080615997, 0.025893118232488632, 0.026849493384361267, 0.027805868536233902, 0.028762243688106537, 0.029718618839979172, 0.030674993991851807]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 5.0, 9.0, 21.0, 14.0, 29.0, 29.0, 39.0, 66.0, 88.0, 151.0, 200.0, 338.0, 496.0, 1103.0, 3044.0, 23548.0, 524894.0, 467805.0, 21248.0, 2902.0, 1038.0, 522.0, 322.0, 199.0, 117.0, 93.0, 73.0, 43.0, 27.0, 26.0, 21.0, 14.0, 4.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03656005859375, -0.03520488739013672, -0.03384971618652344, -0.032494544982910156, -0.031139373779296875, -0.029784202575683594, -0.028429031372070312, -0.02707386016845703, -0.02571868896484375, -0.02436351776123047, -0.023008346557617188, -0.021653175354003906, -0.020298004150390625, -0.018942832946777344, -0.017587661743164062, -0.01623249053955078, -0.0148773193359375, -0.013522148132324219, -0.012166976928710938, -0.010811805725097656, -0.009456634521484375, -0.008101463317871094, -0.0067462921142578125, -0.005391120910644531, -0.00403594970703125, -0.0026807785034179688, -0.0013256072998046875, 2.956390380859375e-05, 0.001384735107421875, 0.0027399063110351562, 0.0040950775146484375, 0.005450248718261719, 0.006805419921875, 0.008160591125488281, 0.009515762329101562, 0.010870933532714844, 0.012226104736328125, 0.013581275939941406, 0.014936447143554688, 0.01629161834716797, 0.01764678955078125, 0.01900196075439453, 0.020357131958007812, 0.021712303161621094, 0.023067474365234375, 0.024422645568847656, 0.025777816772460938, 0.02713298797607422, 0.0284881591796875, 0.02984333038330078, 0.031198501586914062, 0.032553672790527344, 0.033908843994140625, 0.035264015197753906, 0.03661918640136719, 0.03797435760498047, 0.03932952880859375, 0.04068470001220703, 0.04203987121582031, 0.043395042419433594, 0.044750213623046875, 0.046105384826660156, 0.04746055603027344, 0.04881572723388672, 0.0501708984375]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 16.0, 59.0, 182.0, 222.0, 235.0, 190.0, 71.0, 23.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0210418701171875, -0.0205533504486084, -0.020064830780029297, -0.019576311111450195, -0.019087791442871094, -0.018599271774291992, -0.01811075210571289, -0.01762223243713379, -0.017133712768554688, -0.016645193099975586, -0.016156673431396484, -0.015668153762817383, -0.015179634094238281, -0.01469111442565918, -0.014202594757080078, -0.013714075088500977, -0.013225555419921875, -0.012737035751342773, -0.012248516082763672, -0.01175999641418457, -0.011271476745605469, -0.010782957077026367, -0.010294437408447266, -0.009805917739868164, -0.009317398071289062, -0.008828878402709961, -0.00834035873413086, -0.007851839065551758, -0.007363319396972656, -0.006874799728393555, -0.006386280059814453, -0.0058977603912353516, -0.00540924072265625, -0.0049207210540771484, -0.004432201385498047, -0.003943681716918945, -0.0034551620483398438, -0.002966642379760742, -0.0024781227111816406, -0.001989603042602539, -0.0015010833740234375, -0.001012563705444336, -0.0005240440368652344, -3.552436828613281e-05, 0.00045299530029296875, 0.0009415149688720703, 0.0014300346374511719, 0.0019185543060302734, 0.002407073974609375, 0.0028955936431884766, 0.003384113311767578, 0.0038726329803466797, 0.004361152648925781, 0.004849672317504883, 0.005338191986083984, 0.005826711654663086, 0.0063152313232421875, 0.006803750991821289, 0.007292270660400391, 0.007780790328979492, 0.008269309997558594, 0.008757829666137695, 0.009246349334716797, 0.009734869003295898, 0.010223388671875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 2.0, 5.0, 3.0, 1.0, 7.0, 11.0, 9.0, 11.0, 18.0, 24.0, 28.0, 42.0, 68.0, 84.0, 146.0, 207.0, 316.0, 403.0, 646.0, 1054.0, 1657.0, 3057.0, 5218.0, 9766.0, 18618.0, 37030.0, 77010.0, 163639.0, 279603.0, 227484.0, 112467.0, 53400.0, 26258.0, 13163.0, 7044.0, 4040.0, 2200.0, 1303.0, 859.0, 529.0, 358.0, 240.0, 169.0, 105.0, 77.0, 52.0, 26.0, 32.0, 17.0, 18.0, 9.0, 10.0, 7.0, 3.0, 4.0, 3.0, 2.0, 2.0, 4.0, 3.0], "bins": [-0.00882720947265625, -0.008557677268981934, -0.008288145065307617, -0.0080186128616333, -0.007749080657958984, -0.007479548454284668, -0.0072100162506103516, -0.006940484046936035, -0.006670951843261719, -0.006401419639587402, -0.006131887435913086, -0.0058623552322387695, -0.005592823028564453, -0.005323290824890137, -0.00505375862121582, -0.004784226417541504, -0.0045146942138671875, -0.004245162010192871, -0.003975629806518555, -0.0037060976028442383, -0.003436565399169922, -0.0031670331954956055, -0.002897500991821289, -0.0026279687881469727, -0.0023584365844726562, -0.00208890438079834, -0.0018193721771240234, -0.001549839973449707, -0.0012803077697753906, -0.0010107755661010742, -0.0007412433624267578, -0.0004717111587524414, -0.000202178955078125, 6.73532485961914e-05, 0.0003368854522705078, 0.0006064176559448242, 0.0008759498596191406, 0.001145482063293457, 0.0014150142669677734, 0.0016845464706420898, 0.0019540786743164062, 0.0022236108779907227, 0.002493143081665039, 0.0027626752853393555, 0.003032207489013672, 0.0033017396926879883, 0.0035712718963623047, 0.003840804100036621, 0.0041103363037109375, 0.004379868507385254, 0.00464940071105957, 0.004918932914733887, 0.005188465118408203, 0.0054579973220825195, 0.005727529525756836, 0.005997061729431152, 0.006266593933105469, 0.006536126136779785, 0.0068056583404541016, 0.007075190544128418, 0.007344722747802734, 0.007614254951477051, 0.007883787155151367, 0.008153319358825684, 0.0084228515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 3.0, 6.0, 10.0, 9.0, 11.0, 24.0, 20.0, 46.0, 47.0, 54.0, 61.0, 66.0, 92.0, 99.0, 75.0, 77.0, 70.0, 66.0, 45.0, 30.0, 29.0, 20.0, 13.0, 13.0, 3.0, 6.0, 1.0, 5.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0181427001953125, -0.01754593849182129, -0.016949176788330078, -0.016352415084838867, -0.015755653381347656, -0.015158891677856445, -0.014562129974365234, -0.013965368270874023, -0.013368606567382812, -0.012771844863891602, -0.01217508316040039, -0.01157832145690918, -0.010981559753417969, -0.010384798049926758, -0.009788036346435547, -0.009191274642944336, -0.008594512939453125, -0.007997751235961914, -0.007400989532470703, -0.006804227828979492, -0.006207466125488281, -0.00561070442199707, -0.005013942718505859, -0.0044171810150146484, -0.0038204193115234375, -0.0032236576080322266, -0.0026268959045410156, -0.0020301342010498047, -0.0014333724975585938, -0.0008366107940673828, -0.00023984909057617188, 0.00035691261291503906, 0.00095367431640625, 0.001550436019897461, 0.002147197723388672, 0.002743959426879883, 0.0033407211303710938, 0.003937482833862305, 0.004534244537353516, 0.0051310062408447266, 0.0057277679443359375, 0.0063245296478271484, 0.006921291351318359, 0.00751805305480957, 0.008114814758300781, 0.008711576461791992, 0.009308338165283203, 0.009905099868774414, 0.010501861572265625, 0.011098623275756836, 0.011695384979248047, 0.012292146682739258, 0.012888908386230469, 0.01348567008972168, 0.01408243179321289, 0.014679193496704102, 0.015275955200195312, 0.015872716903686523, 0.016469478607177734, 0.017066240310668945, 0.017663002014160156, 0.018259763717651367, 0.018856525421142578, 0.01945328712463379, 0.020050048828125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 10.0, 10.0, 18.0, 14.0, 20.0, 40.0, 50.0, 67.0, 90.0, 169.0, 251.0, 354.0, 588.0, 995.0, 1794.0, 3068.0, 5882.0, 11070.0, 22340.0, 46921.0, 110993.0, 305238.0, 322382.0, 117912.0, 49346.0, 23197.0, 11777.0, 6072.0, 3266.0, 1789.0, 1026.0, 655.0, 390.0, 253.0, 157.0, 101.0, 79.0, 49.0, 37.0, 19.0, 16.0, 10.0, 12.0, 3.0, 8.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.00543212890625, -0.005267679691314697, -0.0051032304763793945, -0.004938781261444092, -0.004774332046508789, -0.004609882831573486, -0.004445433616638184, -0.004280984401702881, -0.004116535186767578, -0.003952085971832275, -0.0037876367568969727, -0.00362318754196167, -0.003458738327026367, -0.0032942891120910645, -0.0031298398971557617, -0.002965390682220459, -0.0028009414672851562, -0.0026364922523498535, -0.0024720430374145508, -0.002307593822479248, -0.0021431446075439453, -0.0019786953926086426, -0.0018142461776733398, -0.0016497969627380371, -0.0014853477478027344, -0.0013208985328674316, -0.001156449317932129, -0.0009920001029968262, -0.0008275508880615234, -0.0006631016731262207, -0.000498652458190918, -0.00033420324325561523, -0.0001697540283203125, -5.304813385009766e-06, 0.00015914440155029297, 0.0003235936164855957, 0.00048804283142089844, 0.0006524920463562012, 0.0008169412612915039, 0.0009813904762268066, 0.0011458396911621094, 0.0013102889060974121, 0.0014747381210327148, 0.0016391873359680176, 0.0018036365509033203, 0.001968085765838623, 0.0021325349807739258, 0.0022969841957092285, 0.0024614334106445312, 0.002625882625579834, 0.0027903318405151367, 0.0029547810554504395, 0.003119230270385742, 0.003283679485321045, 0.0034481287002563477, 0.0036125779151916504, 0.003777027130126953, 0.003941476345062256, 0.004105925559997559, 0.004270374774932861, 0.004434823989868164, 0.004599273204803467, 0.0047637224197387695, 0.004928171634674072, 0.005092620849609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 5.0, 3.0, 2.0, 5.0, 7.0, 9.0, 8.0, 4.0, 14.0, 8.0, 18.0, 14.0, 21.0, 26.0, 22.0, 40.0, 55.0, 47.0, 61.0, 75.0, 75.0, 61.0, 65.0, 52.0, 38.0, 41.0, 41.0, 32.0, 34.0, 24.0, 19.0, 10.0, 10.0, 12.0, 6.0, 5.0, 12.0, 6.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7087669372558594e-05, -4.565343260765076e-05, -4.421919584274292e-05, -4.278495907783508e-05, -4.1350722312927246e-05, -3.991648554801941e-05, -3.848224878311157e-05, -3.7048012018203735e-05, -3.56137752532959e-05, -3.417953848838806e-05, -3.2745301723480225e-05, -3.131106495857239e-05, -2.987682819366455e-05, -2.8442591428756714e-05, -2.7008354663848877e-05, -2.557411789894104e-05, -2.4139881134033203e-05, -2.2705644369125366e-05, -2.127140760421753e-05, -1.9837170839309692e-05, -1.8402934074401855e-05, -1.696869730949402e-05, -1.553446054458618e-05, -1.4100223779678345e-05, -1.2665987014770508e-05, -1.1231750249862671e-05, -9.797513484954834e-06, -8.363276720046997e-06, -6.92903995513916e-06, -5.494803190231323e-06, -4.060566425323486e-06, -2.6263296604156494e-06, -1.1920928955078125e-06, 2.421438694000244e-07, 1.6763806343078613e-06, 3.1106173992156982e-06, 4.544854164123535e-06, 5.979090929031372e-06, 7.413327693939209e-06, 8.847564458847046e-06, 1.0281801223754883e-05, 1.171603798866272e-05, 1.3150274753570557e-05, 1.4584511518478394e-05, 1.601874828338623e-05, 1.7452985048294067e-05, 1.8887221813201904e-05, 2.032145857810974e-05, 2.1755695343017578e-05, 2.3189932107925415e-05, 2.4624168872833252e-05, 2.605840563774109e-05, 2.7492642402648926e-05, 2.8926879167556763e-05, 3.03611159324646e-05, 3.1795352697372437e-05, 3.3229589462280273e-05, 3.466382622718811e-05, 3.609806299209595e-05, 3.7532299757003784e-05, 3.896653652191162e-05, 4.040077328681946e-05, 4.1835010051727295e-05, 4.326924681663513e-05, 4.470348358154297e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 1.0, 2.0, 2.0, 8.0, 13.0, 19.0, 31.0, 45.0, 72.0, 127.0, 191.0, 344.0, 579.0, 1045.0, 1850.0, 3430.0, 6280.0, 11452.0, 21525.0, 41506.0, 85346.0, 201506.0, 342767.0, 174825.0, 75664.0, 37412.0, 19361.0, 10529.0, 5500.0, 3091.0, 1688.0, 971.0, 533.0, 352.0, 193.0, 108.0, 74.0, 49.0, 29.0, 15.0, 12.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 1.0, 2.0, 3.0], "bins": [-0.00478363037109375, -0.004652291536331177, -0.0045209527015686035, -0.00438961386680603, -0.004258275032043457, -0.004126936197280884, -0.0039955973625183105, -0.0038642585277557373, -0.003732919692993164, -0.003601580858230591, -0.0034702420234680176, -0.0033389031887054443, -0.003207564353942871, -0.003076225519180298, -0.0029448866844177246, -0.0028135478496551514, -0.002682209014892578, -0.002550870180130005, -0.0024195313453674316, -0.0022881925106048584, -0.002156853675842285, -0.002025514841079712, -0.0018941760063171387, -0.0017628371715545654, -0.0016314983367919922, -0.001500159502029419, -0.0013688206672668457, -0.0012374818325042725, -0.0011061429977416992, -0.000974804162979126, -0.0008434653282165527, -0.0007121264934539795, -0.0005807876586914062, -0.000449448823928833, -0.00031810998916625977, -0.00018677115440368652, -5.543231964111328e-05, 7.590651512145996e-05, 0.0002072453498840332, 0.00033858418464660645, 0.0004699230194091797, 0.0006012618541717529, 0.0007326006889343262, 0.0008639395236968994, 0.0009952783584594727, 0.001126617193222046, 0.0012579560279846191, 0.0013892948627471924, 0.0015206336975097656, 0.0016519725322723389, 0.0017833113670349121, 0.0019146502017974854, 0.0020459890365600586, 0.002177327871322632, 0.002308666706085205, 0.0024400055408477783, 0.0025713443756103516, 0.002702683210372925, 0.002834022045135498, 0.0029653608798980713, 0.0030966997146606445, 0.0032280385494232178, 0.003359377384185791, 0.0034907162189483643, 0.0036220550537109375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 7.0, 2.0, 5.0, 5.0, 7.0, 3.0, 10.0, 8.0, 16.0, 13.0, 13.0, 24.0, 23.0, 22.0, 25.0, 27.0, 38.0, 55.0, 49.0, 71.0, 71.0, 55.0, 82.0, 55.0, 46.0, 42.0, 34.0, 32.0, 29.0, 22.0, 16.0, 15.0, 12.0, 9.0, 6.0, 11.0, 11.0, 6.0, 3.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0], "bins": [-0.00469970703125, -0.004569441080093384, -0.004439175128936768, -0.004308909177780151, -0.004178643226623535, -0.004048377275466919, -0.003918111324310303, -0.0037878453731536865, -0.0036575794219970703, -0.003527313470840454, -0.003397047519683838, -0.0032667815685272217, -0.0031365156173706055, -0.0030062496662139893, -0.002875983715057373, -0.002745717763900757, -0.0026154518127441406, -0.0024851858615875244, -0.002354919910430908, -0.002224653959274292, -0.0020943880081176758, -0.0019641220569610596, -0.0018338561058044434, -0.0017035901546478271, -0.001573324203491211, -0.0014430582523345947, -0.0013127923011779785, -0.0011825263500213623, -0.001052260398864746, -0.0009219944477081299, -0.0007917284965515137, -0.0006614625453948975, -0.0005311965942382812, -0.00040093064308166504, -0.00027066469192504883, -0.00014039874076843262, -1.0132789611816406e-05, 0.0001201331615447998, 0.000250399112701416, 0.0003806650638580322, 0.0005109310150146484, 0.0006411969661712646, 0.0007714629173278809, 0.0009017288684844971, 0.0010319948196411133, 0.0011622607707977295, 0.0012925267219543457, 0.001422792673110962, 0.0015530586242675781, 0.0016833245754241943, 0.0018135905265808105, 0.0019438564777374268, 0.002074122428894043, 0.002204388380050659, 0.0023346543312072754, 0.0024649202823638916, 0.002595186233520508, 0.002725452184677124, 0.0028557181358337402, 0.0029859840869903564, 0.0031162500381469727, 0.003246515989303589, 0.003376781940460205, 0.0035070478916168213, 0.0036373138427734375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 9.0, 8.0, 19.0, 48.0, 43.0, 87.0, 103.0, 165.0, 172.0, 121.0, 99.0, 55.0, 28.0, 17.0, 6.0, 2.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1124572902917862, -0.10961233079433441, -0.10676737129688263, -0.10392241179943085, -0.10107745230197906, -0.09823249280452728, -0.0953875333070755, -0.09254258126020432, -0.08969762176275253, -0.08685266226530075, -0.08400770276784897, -0.08116274327039719, -0.0783177837729454, -0.07547283172607422, -0.07262787222862244, -0.06978291273117065, -0.06693795323371887, -0.06409299373626709, -0.06124803423881531, -0.058403074741363525, -0.05555811896920204, -0.05271315947175026, -0.04986819997429848, -0.04702324420213699, -0.044178277254104614, -0.04133331775665283, -0.03848835825920105, -0.03564339876174927, -0.032798442989587784, -0.029953483492136, -0.02710852399468422, -0.024263566359877586, -0.021418608725070953, -0.01857364922761917, -0.015728691592812538, -0.012883732095360756, -0.010038773529231548, -0.007193814963102341, -0.0043488554656505585, -0.0015038978308439255, 0.0013410616666078568, 0.004186020232737064, 0.007030979264527559, 0.009875938296318054, 0.012720896862447262, 0.01556585542857647, 0.01841081492602825, 0.021255772560834885, 0.024100732058286667, 0.02694569155573845, 0.029790649190545082, 0.032635606825351715, 0.0354805663228035, 0.03832552582025528, 0.04117048531770706, 0.044015444815158844, 0.046860404312610626, 0.04970536381006241, 0.05255032330751419, 0.05539528280496597, 0.05824023857712746, 0.06108519807457924, 0.06393015384674072, 0.0667751133441925, 0.06962007284164429]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 0.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 11.0, 11.0, 17.0, 9.0, 13.0, 24.0, 23.0, 28.0, 21.0, 27.0, 44.0, 35.0, 30.0, 38.0, 40.0, 33.0, 36.0, 40.0, 40.0, 42.0, 40.0, 37.0, 42.0, 33.0, 30.0, 38.0, 24.0, 24.0, 27.0, 17.0, 18.0, 18.0, 18.0, 10.0, 13.0, 7.0, 12.0, 10.0, 5.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.03746926784515381, -0.03637545183300972, -0.03528163582086563, -0.034187816083431244, -0.033094000071287155, -0.032000184059143066, -0.03090636618435383, -0.02981254830956459, -0.0287187322974205, -0.027624916285276413, -0.026531098410487175, -0.025437280535697937, -0.02434346452355385, -0.02324964851140976, -0.02215583063662052, -0.021062012761831284, -0.019968196749687195, -0.018874380737543106, -0.017780562862753868, -0.01668674498796463, -0.015592928975820541, -0.014499112032353878, -0.013405295088887215, -0.012311478145420551, -0.011217661201953888, -0.010123844258487225, -0.009030027315020561, -0.007936210371553898, -0.0068423934280872345, -0.005748576484620571, -0.004654759541153908, -0.0035609425976872444, -0.002467125654220581, -0.0013733087107539177, -0.00027949176728725433, 0.000814325176179409, 0.0019081421196460724, 0.0030019590631127357, 0.004095776006579399, 0.0051895929500460625, 0.006283409893512726, 0.007377226836979389, 0.008471043780446053, 0.009564860723912716, 0.01065867766737938, 0.011752494610846043, 0.012846311554312706, 0.01394012849777937, 0.015033945441246033, 0.01612776145339012, 0.01722157932817936, 0.018315397202968597, 0.019409213215112686, 0.020503029227256775, 0.021596847102046013, 0.02269066497683525, 0.02378448098897934, 0.02487829700112343, 0.025972114875912666, 0.027065932750701904, 0.028159748762845993, 0.029253564774990082, 0.03034738264977932, 0.03144120052456856, 0.032535016536712646]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 12.0, 17.0, 14.0, 22.0, 40.0, 57.0, 88.0, 195.0, 522.0, 1710.0, 9107.0, 91551.0, 3938003.0, 137350.0, 11280.0, 2652.0, 993.0, 421.0, 125.0, 49.0, 28.0, 15.0, 8.0, 7.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0212860107421875, -0.020632266998291016, -0.01997852325439453, -0.019324779510498047, -0.018671035766601562, -0.018017292022705078, -0.017363548278808594, -0.01670980453491211, -0.016056060791015625, -0.01540231704711914, -0.014748573303222656, -0.014094829559326172, -0.013441085815429688, -0.012787342071533203, -0.012133598327636719, -0.011479854583740234, -0.01082611083984375, -0.010172367095947266, -0.009518623352050781, -0.008864879608154297, -0.008211135864257812, -0.007557392120361328, -0.006903648376464844, -0.006249904632568359, -0.005596160888671875, -0.004942417144775391, -0.004288673400878906, -0.003634929656982422, -0.0029811859130859375, -0.002327442169189453, -0.0016736984252929688, -0.0010199546813964844, -0.0003662109375, 0.0002875328063964844, 0.0009412765502929688, 0.0015950202941894531, 0.0022487640380859375, 0.002902507781982422, 0.0035562515258789062, 0.004209995269775391, 0.004863739013671875, 0.005517482757568359, 0.006171226501464844, 0.006824970245361328, 0.0074787139892578125, 0.008132457733154297, 0.008786201477050781, 0.009439945220947266, 0.01009368896484375, 0.010747432708740234, 0.011401176452636719, 0.012054920196533203, 0.012708663940429688, 0.013362407684326172, 0.014016151428222656, 0.01466989517211914, 0.015323638916015625, 0.01597738265991211, 0.016631126403808594, 0.017284870147705078, 0.017938613891601562, 0.018592357635498047, 0.01924610137939453, 0.019899845123291016, 0.0205535888671875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 26.0, 84.0, 181.0, 228.0, 257.0, 137.0, 64.0, 19.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.023284912109375, -0.02274167537689209, -0.02219843864440918, -0.02165520191192627, -0.02111196517944336, -0.02056872844696045, -0.02002549171447754, -0.01948225498199463, -0.01893901824951172, -0.01839578151702881, -0.0178525447845459, -0.01730930805206299, -0.016766071319580078, -0.016222834587097168, -0.015679597854614258, -0.015136361122131348, -0.014593124389648438, -0.014049887657165527, -0.013506650924682617, -0.012963414192199707, -0.012420177459716797, -0.011876940727233887, -0.011333703994750977, -0.010790467262268066, -0.010247230529785156, -0.009703993797302246, -0.009160757064819336, -0.008617520332336426, -0.008074283599853516, -0.0075310468673706055, -0.006987810134887695, -0.006444573402404785, -0.005901336669921875, -0.005358099937438965, -0.004814863204956055, -0.0042716264724731445, -0.0037283897399902344, -0.0031851530075073242, -0.002641916275024414, -0.002098679542541504, -0.0015554428100585938, -0.0010122060775756836, -0.00046896934509277344, 7.426738739013672e-05, 0.0006175041198730469, 0.001160740852355957, 0.0017039775848388672, 0.0022472143173217773, 0.0027904510498046875, 0.0033336877822875977, 0.003876924514770508, 0.004420161247253418, 0.004963397979736328, 0.005506634712219238, 0.0060498714447021484, 0.006593108177185059, 0.007136344909667969, 0.007679581642150879, 0.008222818374633789, 0.0087660551071167, 0.00930929183959961, 0.00985252857208252, 0.01039576530456543, 0.01093900203704834, 0.01148223876953125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 12.0, 10.0, 14.0, 19.0, 23.0, 45.0, 69.0, 141.0, 257.0, 469.0, 1200.0, 2996.0, 9716.0, 42719.0, 440071.0, 3515461.0, 148441.0, 22845.0, 5988.0, 2084.0, 807.0, 417.0, 198.0, 117.0, 58.0, 43.0, 27.0, 19.0, 10.0, 7.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01165008544921875, -0.011207222938537598, -0.010764360427856445, -0.010321497917175293, -0.00987863540649414, -0.009435772895812988, -0.008992910385131836, -0.008550047874450684, -0.008107185363769531, -0.007664322853088379, -0.0072214603424072266, -0.006778597831726074, -0.006335735321044922, -0.0058928728103637695, -0.005450010299682617, -0.005007147789001465, -0.0045642852783203125, -0.00412142276763916, -0.003678560256958008, -0.0032356977462768555, -0.002792835235595703, -0.0023499727249145508, -0.0019071102142333984, -0.001464247703552246, -0.0010213851928710938, -0.0005785226821899414, -0.00013566017150878906, 0.0003072023391723633, 0.0007500648498535156, 0.001192927360534668, 0.0016357898712158203, 0.0020786523818969727, 0.002521514892578125, 0.0029643774032592773, 0.0034072399139404297, 0.003850102424621582, 0.004292964935302734, 0.004735827445983887, 0.005178689956665039, 0.005621552467346191, 0.006064414978027344, 0.006507277488708496, 0.0069501399993896484, 0.007393002510070801, 0.007835865020751953, 0.008278727531433105, 0.008721590042114258, 0.00916445255279541, 0.009607315063476562, 0.010050177574157715, 0.010493040084838867, 0.01093590259552002, 0.011378765106201172, 0.011821627616882324, 0.012264490127563477, 0.012707352638244629, 0.013150215148925781, 0.013593077659606934, 0.014035940170288086, 0.014478802680969238, 0.01492166519165039, 0.015364527702331543, 0.015807390213012695, 0.016250252723693848, 0.016693115234375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 5.0, 3.0, 1.0, 6.0, 15.0, 7.0, 21.0, 24.0, 33.0, 63.0, 115.0, 230.0, 582.0, 1282.0, 896.0, 323.0, 161.0, 102.0, 69.0, 40.0, 24.0, 24.0, 11.0, 8.0, 5.0, 8.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01123046875, -0.010886669158935547, -0.010542869567871094, -0.01019906997680664, -0.009855270385742188, -0.009511470794677734, -0.009167671203613281, -0.008823871612548828, -0.008480072021484375, -0.008136272430419922, -0.007792472839355469, -0.007448673248291016, -0.0071048736572265625, -0.006761074066162109, -0.006417274475097656, -0.006073474884033203, -0.00572967529296875, -0.005385875701904297, -0.005042076110839844, -0.004698276519775391, -0.0043544769287109375, -0.004010677337646484, -0.0036668777465820312, -0.003323078155517578, -0.002979278564453125, -0.002635478973388672, -0.0022916793823242188, -0.0019478797912597656, -0.0016040802001953125, -0.0012602806091308594, -0.0009164810180664062, -0.0005726814270019531, -0.0002288818359375, 0.00011491775512695312, 0.00045871734619140625, 0.0008025169372558594, 0.0011463165283203125, 0.0014901161193847656, 0.0018339157104492188, 0.002177715301513672, 0.002521514892578125, 0.002865314483642578, 0.0032091140747070312, 0.0035529136657714844, 0.0038967132568359375, 0.004240512847900391, 0.004584312438964844, 0.004928112030029297, 0.00527191162109375, 0.005615711212158203, 0.005959510803222656, 0.006303310394287109, 0.0066471099853515625, 0.006990909576416016, 0.007334709167480469, 0.007678508758544922, 0.008022308349609375, 0.008366107940673828, 0.008709907531738281, 0.009053707122802734, 0.009397506713867188, 0.00974130630493164, 0.010085105895996094, 0.010428905487060547, 0.010772705078125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 8.0, 14.0, 82.0, 237.0, 359.0, 203.0, 66.0, 20.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07317794114351273, -0.06897740811109543, -0.06477688252925873, -0.06057634949684143, -0.05637582018971443, -0.05217529088258743, -0.047974757850170135, -0.04377422854304314, -0.03957369923591614, -0.03537316992878914, -0.03117263875901699, -0.026972107589244843, -0.022771578282117844, -0.018571048974990845, -0.014370517805218697, -0.010169986635446548, -0.0059694573283195496, -0.001768927089869976, 0.0024316031485795975, 0.006632133387029171, 0.010832663625478745, 0.015033192932605743, 0.01923372410237789, 0.02343425527215004, 0.02763478457927704, 0.03183531388640404, 0.036035843193531036, 0.040236376225948334, 0.04443690553307533, 0.04863743484020233, 0.05283796787261963, 0.05703849717974663, 0.06123901903629303, 0.06543955206871033, 0.06964007765054703, 0.07384061068296432, 0.07804113626480103, 0.08224166929721832, 0.08644220232963562, 0.09064273536205292, 0.09484326094388962, 0.09904379397630692, 0.10324431955814362, 0.10744485259056091, 0.11164538562297821, 0.11584591120481491, 0.12004644423723221, 0.12424696981906891, 0.1284475028514862, 0.1326480358839035, 0.1368485689163208, 0.1410490870475769, 0.1452496200799942, 0.1494501531124115, 0.1536506861448288, 0.1578512191772461, 0.1620517373085022, 0.1662522703409195, 0.1704528033733368, 0.1746533215045929, 0.1788538545370102, 0.1830543875694275, 0.1872549206018448, 0.19145545363426208, 0.19565598666667938]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 6.0, 8.0, 13.0, 14.0, 22.0, 18.0, 24.0, 26.0, 28.0, 39.0, 42.0, 47.0, 52.0, 55.0, 47.0, 49.0, 54.0, 58.0, 33.0, 56.0, 42.0, 50.0, 46.0, 28.0, 32.0, 23.0, 23.0, 16.0, 13.0, 5.0, 9.0, 10.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.037991344928741455, -0.03697039186954498, -0.03594944253563881, -0.034928493201732635, -0.03390754014253616, -0.03288658708333969, -0.03186563774943352, -0.030844686552882195, -0.02982373535633087, -0.02880278415977955, -0.027781832963228226, -0.026760881766676903, -0.02573993057012558, -0.024718979373574257, -0.023698028177022934, -0.02267707698047161, -0.021656125783920288, -0.020635174587368965, -0.019614223390817642, -0.01859327219426632, -0.017572320997714996, -0.016551369801163673, -0.01553041860461235, -0.014509467408061028, -0.013488516211509705, -0.012467565014958382, -0.011446613818407059, -0.010425662621855736, -0.009404711425304413, -0.00838376022875309, -0.007362809032201767, -0.006341857835650444, -0.005320906639099121, -0.004299955442547798, -0.0032790042459964752, -0.0022580530494451523, -0.0012371018528938293, -0.0002161506563425064, 0.0008048005402088165, 0.0018257517367601395, 0.0028467029333114624, 0.0038676541298627853, 0.004888605326414108, 0.005909556522965431, 0.006930507719516754, 0.007951458916068077, 0.0089724101126194, 0.009993361309170723, 0.011014312505722046, 0.012035263702273369, 0.013056214898824692, 0.014077166095376015, 0.015098117291927338, 0.01611906848847866, 0.017140019685029984, 0.018160970881581306, 0.01918192207813263, 0.020202873274683952, 0.021223824471235275, 0.022244775667786598, 0.02326572686433792, 0.024286678060889244, 0.025307629257440567, 0.02632858045399189, 0.027349531650543213]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 9.0, 10.0, 11.0, 15.0, 21.0, 29.0, 27.0, 47.0, 67.0, 93.0, 151.0, 230.0, 424.0, 846.0, 2304.0, 11497.0, 121565.0, 746096.0, 147177.0, 13283.0, 2583.0, 887.0, 442.0, 247.0, 151.0, 97.0, 75.0, 50.0, 38.0, 27.0, 17.0, 9.0, 14.0, 4.0, 4.0, 5.0, 2.0, 0.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.044586181640625, -0.043172359466552734, -0.04175853729248047, -0.0403447151184082, -0.03893089294433594, -0.03751707077026367, -0.036103248596191406, -0.03468942642211914, -0.033275604248046875, -0.03186178207397461, -0.030447959899902344, -0.029034137725830078, -0.027620315551757812, -0.026206493377685547, -0.02479267120361328, -0.023378849029541016, -0.02196502685546875, -0.020551204681396484, -0.01913738250732422, -0.017723560333251953, -0.016309738159179688, -0.014895915985107422, -0.013482093811035156, -0.01206827163696289, -0.010654449462890625, -0.00924062728881836, -0.007826805114746094, -0.006412982940673828, -0.0049991607666015625, -0.003585338592529297, -0.0021715164184570312, -0.0007576942443847656, 0.0006561279296875, 0.0020699501037597656, 0.0034837722778320312, 0.004897594451904297, 0.0063114166259765625, 0.007725238800048828, 0.009139060974121094, 0.01055288314819336, 0.011966705322265625, 0.01338052749633789, 0.014794349670410156, 0.016208171844482422, 0.017621994018554688, 0.019035816192626953, 0.02044963836669922, 0.021863460540771484, 0.02327728271484375, 0.024691104888916016, 0.02610492706298828, 0.027518749237060547, 0.028932571411132812, 0.030346393585205078, 0.031760215759277344, 0.03317403793334961, 0.034587860107421875, 0.03600168228149414, 0.037415504455566406, 0.03882932662963867, 0.04024314880371094, 0.0416569709777832, 0.04307079315185547, 0.044484615325927734, 0.0458984375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 8.0, 23.0, 66.0, 167.0, 214.0, 227.0, 154.0, 95.0, 39.0, 10.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0219573974609375, -0.021423697471618652, -0.020889997482299805, -0.020356297492980957, -0.01982259750366211, -0.01928889751434326, -0.018755197525024414, -0.018221497535705566, -0.01768779754638672, -0.01715409755706787, -0.016620397567749023, -0.016086697578430176, -0.015552997589111328, -0.01501929759979248, -0.014485597610473633, -0.013951897621154785, -0.013418197631835938, -0.01288449764251709, -0.012350797653198242, -0.011817097663879395, -0.011283397674560547, -0.0107496976852417, -0.010215997695922852, -0.009682297706604004, -0.009148597717285156, -0.008614897727966309, -0.008081197738647461, -0.007547497749328613, -0.007013797760009766, -0.006480097770690918, -0.00594639778137207, -0.005412697792053223, -0.004878997802734375, -0.004345297813415527, -0.0038115978240966797, -0.003277897834777832, -0.0027441978454589844, -0.0022104978561401367, -0.001676797866821289, -0.0011430978775024414, -0.0006093978881835938, -7.56978988647461e-05, 0.00045800209045410156, 0.0009917020797729492, 0.0015254020690917969, 0.0020591020584106445, 0.002592802047729492, 0.00312650203704834, 0.0036602020263671875, 0.004193902015686035, 0.004727602005004883, 0.0052613019943237305, 0.005795001983642578, 0.006328701972961426, 0.0068624019622802734, 0.007396101951599121, 0.007929801940917969, 0.008463501930236816, 0.008997201919555664, 0.009530901908874512, 0.01006460189819336, 0.010598301887512207, 0.011132001876831055, 0.011665701866149902, 0.01219940185546875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 5.0, 4.0, 0.0, 6.0, 10.0, 12.0, 10.0, 21.0, 31.0, 35.0, 60.0, 93.0, 125.0, 228.0, 349.0, 542.0, 992.0, 1784.0, 3294.0, 6627.0, 14188.0, 32255.0, 77061.0, 189209.0, 337389.0, 221201.0, 92125.0, 38135.0, 16471.0, 7727.0, 3799.0, 1957.0, 1099.0, 627.0, 389.0, 230.0, 135.0, 106.0, 81.0, 40.0, 23.0, 29.0, 21.0, 9.0, 9.0, 2.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01531982421875, -0.014863848686218262, -0.014407873153686523, -0.013951897621154785, -0.013495922088623047, -0.013039946556091309, -0.01258397102355957, -0.012127995491027832, -0.011672019958496094, -0.011216044425964355, -0.010760068893432617, -0.010304093360900879, -0.00984811782836914, -0.009392142295837402, -0.008936166763305664, -0.008480191230773926, -0.008024215698242188, -0.007568240165710449, -0.007112264633178711, -0.006656289100646973, -0.006200313568115234, -0.005744338035583496, -0.005288362503051758, -0.0048323869705200195, -0.004376411437988281, -0.003920435905456543, -0.0034644603729248047, -0.0030084848403930664, -0.002552509307861328, -0.00209653377532959, -0.0016405582427978516, -0.0011845827102661133, -0.000728607177734375, -0.0002726316452026367, 0.00018334388732910156, 0.0006393194198608398, 0.0010952949523925781, 0.0015512704849243164, 0.0020072460174560547, 0.002463221549987793, 0.0029191970825195312, 0.0033751726150512695, 0.003831148147583008, 0.004287123680114746, 0.004743099212646484, 0.005199074745178223, 0.005655050277709961, 0.006111025810241699, 0.0065670013427734375, 0.007022976875305176, 0.007478952407836914, 0.007934927940368652, 0.00839090347290039, 0.008846879005432129, 0.009302854537963867, 0.009758830070495605, 0.010214805603027344, 0.010670781135559082, 0.01112675666809082, 0.011582732200622559, 0.012038707733154297, 0.012494683265686035, 0.012950658798217773, 0.013406634330749512, 0.01386260986328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 8.0, 5.0, 5.0, 3.0, 7.0, 16.0, 19.0, 11.0, 26.0, 26.0, 24.0, 50.0, 42.0, 48.0, 41.0, 55.0, 72.0, 56.0, 66.0, 47.0, 54.0, 48.0, 44.0, 44.0, 32.0, 25.0, 24.0, 26.0, 17.0, 14.0, 14.0, 3.0, 7.0, 5.0, 9.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0174102783203125, -0.01684403419494629, -0.016277790069580078, -0.015711545944213867, -0.015145301818847656, -0.014579057693481445, -0.014012813568115234, -0.013446569442749023, -0.012880325317382812, -0.012314081192016602, -0.01174783706665039, -0.01118159294128418, -0.010615348815917969, -0.010049104690551758, -0.009482860565185547, -0.008916616439819336, -0.008350372314453125, -0.007784128189086914, -0.007217884063720703, -0.006651639938354492, -0.006085395812988281, -0.00551915168762207, -0.004952907562255859, -0.0043866634368896484, -0.0038204193115234375, -0.0032541751861572266, -0.0026879310607910156, -0.0021216869354248047, -0.0015554428100585938, -0.0009891986846923828, -0.0004229545593261719, 0.00014328956604003906, 0.00070953369140625, 0.001275777816772461, 0.0018420219421386719, 0.002408266067504883, 0.0029745101928710938, 0.0035407543182373047, 0.004106998443603516, 0.0046732425689697266, 0.0052394866943359375, 0.0058057308197021484, 0.006371974945068359, 0.00693821907043457, 0.007504463195800781, 0.008070707321166992, 0.008636951446533203, 0.009203195571899414, 0.009769439697265625, 0.010335683822631836, 0.010901927947998047, 0.011468172073364258, 0.012034416198730469, 0.01260066032409668, 0.01316690444946289, 0.013733148574829102, 0.014299392700195312, 0.014865636825561523, 0.015431880950927734, 0.015998125076293945, 0.016564369201660156, 0.017130613327026367, 0.017696857452392578, 0.01826310157775879, 0.018829345703125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 3.0, 10.0, 11.0, 25.0, 26.0, 44.0, 71.0, 102.0, 182.0, 317.0, 531.0, 942.0, 1739.0, 3430.0, 7062.0, 15952.0, 39074.0, 116576.0, 453819.0, 285244.0, 73342.0, 27278.0, 11552.0, 5294.0, 2647.0, 1387.0, 770.0, 418.0, 306.0, 132.0, 97.0, 53.0, 34.0, 25.0, 19.0, 14.0, 5.0, 3.0, 7.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01015472412109375, -0.009835481643676758, -0.009516239166259766, -0.009196996688842773, -0.008877754211425781, -0.008558511734008789, -0.008239269256591797, -0.007920026779174805, -0.0076007843017578125, -0.00728154182434082, -0.006962299346923828, -0.006643056869506836, -0.006323814392089844, -0.0060045719146728516, -0.005685329437255859, -0.005366086959838867, -0.005046844482421875, -0.004727602005004883, -0.004408359527587891, -0.0040891170501708984, -0.0037698745727539062, -0.003450632095336914, -0.003131389617919922, -0.0028121471405029297, -0.0024929046630859375, -0.0021736621856689453, -0.0018544197082519531, -0.001535177230834961, -0.0012159347534179688, -0.0008966922760009766, -0.0005774497985839844, -0.0002582073211669922, 6.103515625e-05, 0.0003802776336669922, 0.0006995201110839844, 0.0010187625885009766, 0.0013380050659179688, 0.001657247543334961, 0.001976490020751953, 0.0022957324981689453, 0.0026149749755859375, 0.0029342174530029297, 0.003253459930419922, 0.003572702407836914, 0.0038919448852539062, 0.0042111873626708984, 0.004530429840087891, 0.004849672317504883, 0.005168914794921875, 0.005488157272338867, 0.005807399749755859, 0.0061266422271728516, 0.006445884704589844, 0.006765127182006836, 0.007084369659423828, 0.00740361213684082, 0.0077228546142578125, 0.008042097091674805, 0.008361339569091797, 0.008680582046508789, 0.008999824523925781, 0.009319067001342773, 0.009638309478759766, 0.009957551956176758, 0.01027679443359375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 3.0, 2.0, 6.0, 10.0, 12.0, 13.0, 18.0, 27.0, 42.0, 65.0, 79.0, 95.0, 102.0, 106.0, 102.0, 82.0, 70.0, 53.0, 27.0, 20.0, 13.0, 14.0, 11.0, 7.0, 5.0, 3.0, 0.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.459257125854492e-05, -9.222608059644699e-05, -8.985958993434906e-05, -8.749309927225113e-05, -8.51266086101532e-05, -8.276011794805527e-05, -8.039362728595734e-05, -7.80271366238594e-05, -7.566064596176147e-05, -7.329415529966354e-05, -7.092766463756561e-05, -6.856117397546768e-05, -6.619468331336975e-05, -6.382819265127182e-05, -6.146170198917389e-05, -5.909521132707596e-05, -5.672872066497803e-05, -5.4362230002880096e-05, -5.1995739340782166e-05, -4.9629248678684235e-05, -4.7262758016586304e-05, -4.489626735448837e-05, -4.252977669239044e-05, -4.016328603029251e-05, -3.779679536819458e-05, -3.543030470609665e-05, -3.306381404399872e-05, -3.069732338190079e-05, -2.8330832719802856e-05, -2.5964342057704926e-05, -2.3597851395606995e-05, -2.1231360733509064e-05, -1.8864870071411133e-05, -1.6498379409313202e-05, -1.4131888747215271e-05, -1.176539808511734e-05, -9.39890742301941e-06, -7.032416760921478e-06, -4.665926098823547e-06, -2.2994354367256165e-06, 6.705522537231445e-08, 2.4335458874702454e-06, 4.800036549568176e-06, 7.166527211666107e-06, 9.533017873764038e-06, 1.1899508535861969e-05, 1.42659991979599e-05, 1.663248986005783e-05, 1.8998980522155762e-05, 2.1365471184253693e-05, 2.3731961846351624e-05, 2.6098452508449554e-05, 2.8464943170547485e-05, 3.0831433832645416e-05, 3.319792449474335e-05, 3.556441515684128e-05, 3.793090581893921e-05, 4.029739648103714e-05, 4.266388714313507e-05, 4.5030377805233e-05, 4.739686846733093e-05, 4.9763359129428864e-05, 5.2129849791526794e-05, 5.4496340453624725e-05, 5.6862831115722656e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 12.0, 9.0, 17.0, 28.0, 37.0, 57.0, 81.0, 130.0, 195.0, 379.0, 567.0, 1080.0, 1913.0, 3835.0, 8193.0, 18322.0, 49325.0, 189973.0, 537712.0, 160821.0, 43718.0, 16748.0, 7541.0, 3545.0, 1849.0, 939.0, 624.0, 312.0, 212.0, 128.0, 71.0, 56.0, 51.0, 15.0, 16.0, 11.0, 10.0, 4.0, 3.0, 7.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0119781494140625, -0.011630415916442871, -0.011282682418823242, -0.010934948921203613, -0.010587215423583984, -0.010239481925964355, -0.009891748428344727, -0.009544014930725098, -0.009196281433105469, -0.00884854793548584, -0.008500814437866211, -0.008153080940246582, -0.007805347442626953, -0.007457613945007324, -0.007109880447387695, -0.006762146949768066, -0.0064144134521484375, -0.006066679954528809, -0.00571894645690918, -0.005371212959289551, -0.005023479461669922, -0.004675745964050293, -0.004328012466430664, -0.003980278968811035, -0.0036325454711914062, -0.0032848119735717773, -0.0029370784759521484, -0.0025893449783325195, -0.0022416114807128906, -0.0018938779830932617, -0.0015461444854736328, -0.001198410987854004, -0.000850677490234375, -0.0005029439926147461, -0.0001552104949951172, 0.00019252300262451172, 0.0005402565002441406, 0.0008879899978637695, 0.0012357234954833984, 0.0015834569931030273, 0.0019311904907226562, 0.002278923988342285, 0.002626657485961914, 0.002974390983581543, 0.003322124481201172, 0.0036698579788208008, 0.00401759147644043, 0.004365324974060059, 0.0047130584716796875, 0.005060791969299316, 0.005408525466918945, 0.005756258964538574, 0.006103992462158203, 0.006451725959777832, 0.006799459457397461, 0.00714719295501709, 0.007494926452636719, 0.007842659950256348, 0.008190393447875977, 0.008538126945495605, 0.008885860443115234, 0.009233593940734863, 0.009581327438354492, 0.009929060935974121, 0.01027679443359375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 8.0, 10.0, 8.0, 8.0, 8.0, 9.0, 12.0, 22.0, 22.0, 39.0, 62.0, 83.0, 100.0, 124.0, 119.0, 102.0, 64.0, 52.0, 35.0, 19.0, 12.0, 8.0, 12.0, 9.0, 11.0, 6.0, 7.0, 7.0, 5.0, 4.0, 5.0, 4.0, 1.0, 6.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0106048583984375, -0.010271906852722168, -0.009938955307006836, -0.009606003761291504, -0.009273052215576172, -0.00894010066986084, -0.008607149124145508, -0.008274197578430176, -0.007941246032714844, -0.007608294486999512, -0.00727534294128418, -0.006942391395568848, -0.006609439849853516, -0.006276488304138184, -0.0059435367584228516, -0.0056105852127075195, -0.0052776336669921875, -0.0049446821212768555, -0.0046117305755615234, -0.004278779029846191, -0.003945827484130859, -0.0036128759384155273, -0.0032799243927001953, -0.0029469728469848633, -0.0026140213012695312, -0.0022810697555541992, -0.0019481182098388672, -0.0016151666641235352, -0.0012822151184082031, -0.0009492635726928711, -0.0006163120269775391, -0.00028336048126220703, 4.9591064453125e-05, 0.00038254261016845703, 0.0007154941558837891, 0.001048445701599121, 0.0013813972473144531, 0.0017143487930297852, 0.002047300338745117, 0.0023802518844604492, 0.0027132034301757812, 0.0030461549758911133, 0.0033791065216064453, 0.0037120580673217773, 0.004045009613037109, 0.004377961158752441, 0.0047109127044677734, 0.0050438642501831055, 0.0053768157958984375, 0.0057097673416137695, 0.0060427188873291016, 0.006375670433044434, 0.006708621978759766, 0.007041573524475098, 0.00737452507019043, 0.007707476615905762, 0.008040428161621094, 0.008373379707336426, 0.008706331253051758, 0.00903928279876709, 0.009372234344482422, 0.009705185890197754, 0.010038137435913086, 0.010371088981628418, 0.01070404052734375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 4.0, 2.0, 2.0, 9.0, 17.0, 30.0, 56.0, 108.0, 158.0, 199.0, 189.0, 120.0, 53.0, 25.0, 21.0, 1.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2707662582397461, -0.2650006115436554, -0.2592349350452423, -0.2534692883491516, -0.24770361185073853, -0.24193796515464783, -0.23617228865623474, -0.23040664196014404, -0.22464098036289215, -0.21887531876564026, -0.21310965716838837, -0.20734399557113647, -0.20157833397388458, -0.1958126723766327, -0.190047025680542, -0.1842813640832901, -0.1785157024860382, -0.17275004088878632, -0.16698437929153442, -0.16121871769428253, -0.15545305609703064, -0.14968740940093994, -0.14392173290252686, -0.13815608620643616, -0.13239040970802307, -0.12662474811077118, -0.12085908651351929, -0.1150934249162674, -0.1093277707695961, -0.10356210917234421, -0.09779644757509232, -0.09203079342842102, -0.08626512438058853, -0.08049946278333664, -0.07473380118608475, -0.06896814703941345, -0.06320248544216156, -0.05743682384490967, -0.051671162247657776, -0.04590550437569618, -0.04013984277844429, -0.0343741811811924, -0.028608523309230804, -0.022842861711978912, -0.01707720197737217, -0.011311542242765427, -0.0055458806455135345, 0.00021977722644805908, 0.005985438823699951, 0.011751098558306694, 0.017516758292913437, 0.02328241989016533, 0.029048079624772072, 0.034813739359378815, 0.04057940095663071, 0.0463450588285923, 0.05211072042584419, 0.057876382023096085, 0.06364203989505768, 0.06940770149230957, 0.07517336308956146, 0.08093902468681335, 0.08670468628406525, 0.09247034043073654, 0.09823600202798843]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 3.0, 5.0, 6.0, 10.0, 5.0, 8.0, 17.0, 18.0, 12.0, 25.0, 21.0, 29.0, 25.0, 37.0, 44.0, 52.0, 33.0, 30.0, 40.0, 42.0, 37.0, 40.0, 55.0, 42.0, 43.0, 29.0, 34.0, 43.0, 22.0, 43.0, 29.0, 23.0, 21.0, 14.0, 16.0, 10.0, 10.0, 8.0, 6.0, 5.0, 1.0, 5.0, 0.0, 3.0, 1.0, 6.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0536540150642395, -0.05201989412307739, -0.05038577690720558, -0.04875165969133377, -0.04711753875017166, -0.04548341780900955, -0.04384930059313774, -0.04221518337726593, -0.04058106243610382, -0.03894694149494171, -0.0373128242790699, -0.03567870706319809, -0.03404458612203598, -0.03241046518087387, -0.03077634796500206, -0.0291422288864851, -0.02750810980796814, -0.02587399072945118, -0.02423987165093422, -0.02260575257241726, -0.0209716334939003, -0.01933751441538334, -0.01770339533686638, -0.01606927625834942, -0.014435157179832458, -0.012801038101315498, -0.011166919022798538, -0.009532799944281578, -0.007898680865764618, -0.006264561787247658, -0.004630442708730698, -0.0029963236302137375, -0.0013622045516967773, 0.0002719145268201828, 0.001906033605337143, 0.003540152683854103, 0.005174271762371063, 0.006808390840888023, 0.008442509919404984, 0.010076628997921944, 0.011710748076438904, 0.013344867154955864, 0.014978986233472824, 0.016613105311989784, 0.018247224390506744, 0.019881343469023705, 0.021515462547540665, 0.023149581626057625, 0.024783700704574585, 0.026417819783091545, 0.028051938861608505, 0.029686057940125465, 0.031320177018642426, 0.032954297959804535, 0.034588415175676346, 0.03622253239154816, 0.037856653332710266, 0.039490774273872375, 0.041124891489744186, 0.042759008705616, 0.04439312964677811, 0.046027250587940216, 0.04766136780381203, 0.04929548501968384, 0.05092960596084595]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 5.0, 7.0, 6.0, 10.0, 12.0, 15.0, 24.0, 23.0, 41.0, 65.0, 78.0, 130.0, 231.0, 440.0, 986.0, 2724.0, 9544.0, 42830.0, 532442.0, 3401764.0, 167326.0, 24301.0, 6659.0, 2375.0, 1194.0, 495.0, 241.0, 129.0, 67.0, 39.0, 27.0, 21.0, 10.0, 8.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.019561767578125, -0.019037723541259766, -0.01851367950439453, -0.017989635467529297, -0.017465591430664062, -0.016941547393798828, -0.016417503356933594, -0.01589345932006836, -0.015369415283203125, -0.01484537124633789, -0.014321327209472656, -0.013797283172607422, -0.013273239135742188, -0.012749195098876953, -0.012225151062011719, -0.011701107025146484, -0.01117706298828125, -0.010653018951416016, -0.010128974914550781, -0.009604930877685547, -0.009080886840820312, -0.008556842803955078, -0.008032798767089844, -0.007508754730224609, -0.006984710693359375, -0.006460666656494141, -0.005936622619628906, -0.005412578582763672, -0.0048885345458984375, -0.004364490509033203, -0.0038404464721679688, -0.0033164024353027344, -0.0027923583984375, -0.0022683143615722656, -0.0017442703247070312, -0.0012202262878417969, -0.0006961822509765625, -0.00017213821411132812, 0.00035190582275390625, 0.0008759498596191406, 0.001399993896484375, 0.0019240379333496094, 0.0024480819702148438, 0.002972126007080078, 0.0034961700439453125, 0.004020214080810547, 0.004544258117675781, 0.005068302154541016, 0.00559234619140625, 0.006116390228271484, 0.006640434265136719, 0.007164478302001953, 0.0076885223388671875, 0.008212566375732422, 0.008736610412597656, 0.00926065444946289, 0.009784698486328125, 0.01030874252319336, 0.010832786560058594, 0.011356830596923828, 0.011880874633789062, 0.012404918670654297, 0.012928962707519531, 0.013453006744384766, 0.01397705078125]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 12.0, 11.0, 48.0, 75.0, 136.0, 179.0, 191.0, 154.0, 105.0, 60.0, 18.0, 10.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022613525390625, -0.022064924240112305, -0.02151632308959961, -0.020967721939086914, -0.02041912078857422, -0.019870519638061523, -0.019321918487548828, -0.018773317337036133, -0.018224716186523438, -0.017676115036010742, -0.017127513885498047, -0.01657891273498535, -0.016030311584472656, -0.015481710433959961, -0.014933109283447266, -0.01438450813293457, -0.013835906982421875, -0.01328730583190918, -0.012738704681396484, -0.012190103530883789, -0.011641502380371094, -0.011092901229858398, -0.010544300079345703, -0.009995698928833008, -0.009447097778320312, -0.008898496627807617, -0.008349895477294922, -0.0078012943267822266, -0.007252693176269531, -0.006704092025756836, -0.006155490875244141, -0.005606889724731445, -0.00505828857421875, -0.004509687423706055, -0.003961086273193359, -0.003412485122680664, -0.0028638839721679688, -0.0023152828216552734, -0.0017666816711425781, -0.0012180805206298828, -0.0006694793701171875, -0.00012087821960449219, 0.0004277229309082031, 0.0009763240814208984, 0.0015249252319335938, 0.002073526382446289, 0.0026221275329589844, 0.0031707286834716797, 0.003719329833984375, 0.00426793098449707, 0.004816532135009766, 0.005365133285522461, 0.005913734436035156, 0.0064623355865478516, 0.007010936737060547, 0.007559537887573242, 0.008108139038085938, 0.008656740188598633, 0.009205341339111328, 0.009753942489624023, 0.010302543640136719, 0.010851144790649414, 0.01139974594116211, 0.011948347091674805, 0.0124969482421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 7.0, 10.0, 13.0, 16.0, 32.0, 63.0, 89.0, 120.0, 207.0, 381.0, 653.0, 1262.0, 2630.0, 6114.0, 16225.0, 55751.0, 303104.0, 3244012.0, 460031.0, 70972.0, 19500.0, 6945.0, 2906.0, 1402.0, 739.0, 437.0, 248.0, 147.0, 82.0, 57.0, 32.0, 25.0, 29.0, 9.0, 12.0, 5.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.01483917236328125, -0.014422178268432617, -0.014005184173583984, -0.013588190078735352, -0.013171195983886719, -0.012754201889038086, -0.012337207794189453, -0.01192021369934082, -0.011503219604492188, -0.011086225509643555, -0.010669231414794922, -0.010252237319946289, -0.009835243225097656, -0.009418249130249023, -0.00900125503540039, -0.008584260940551758, -0.008167266845703125, -0.007750272750854492, -0.007333278656005859, -0.0069162845611572266, -0.006499290466308594, -0.006082296371459961, -0.005665302276611328, -0.005248308181762695, -0.0048313140869140625, -0.00441431999206543, -0.003997325897216797, -0.003580331802368164, -0.0031633377075195312, -0.0027463436126708984, -0.0023293495178222656, -0.0019123554229736328, -0.001495361328125, -0.0010783672332763672, -0.0006613731384277344, -0.00024437904357910156, 0.00017261505126953125, 0.0005896091461181641, 0.0010066032409667969, 0.0014235973358154297, 0.0018405914306640625, 0.0022575855255126953, 0.002674579620361328, 0.003091573715209961, 0.0035085678100585938, 0.0039255619049072266, 0.004342555999755859, 0.004759550094604492, 0.005176544189453125, 0.005593538284301758, 0.006010532379150391, 0.0064275264739990234, 0.006844520568847656, 0.007261514663696289, 0.007678508758544922, 0.008095502853393555, 0.008512496948242188, 0.00892949104309082, 0.009346485137939453, 0.009763479232788086, 0.010180473327636719, 0.010597467422485352, 0.011014461517333984, 0.011431455612182617, 0.01184844970703125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 5.0, 11.0, 12.0, 11.0, 20.0, 30.0, 50.0, 91.0, 127.0, 237.0, 563.0, 1262.0, 847.0, 345.0, 165.0, 93.0, 70.0, 38.0, 28.0, 16.0, 13.0, 12.0, 8.0, 4.0, 3.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0146484375, -0.014169931411743164, -0.013691425323486328, -0.013212919235229492, -0.012734413146972656, -0.01225590705871582, -0.011777400970458984, -0.011298894882202148, -0.010820388793945312, -0.010341882705688477, -0.00986337661743164, -0.009384870529174805, -0.008906364440917969, -0.008427858352661133, -0.007949352264404297, -0.007470846176147461, -0.006992340087890625, -0.006513833999633789, -0.006035327911376953, -0.005556821823120117, -0.005078315734863281, -0.004599809646606445, -0.004121303558349609, -0.0036427974700927734, -0.0031642913818359375, -0.0026857852935791016, -0.0022072792053222656, -0.0017287731170654297, -0.0012502670288085938, -0.0007717609405517578, -0.0002932548522949219, 0.00018525123596191406, 0.00066375732421875, 0.001142263412475586, 0.0016207695007324219, 0.002099275588989258, 0.0025777816772460938, 0.0030562877655029297, 0.0035347938537597656, 0.0040132999420166016, 0.0044918060302734375, 0.0049703121185302734, 0.005448818206787109, 0.005927324295043945, 0.006405830383300781, 0.006884336471557617, 0.007362842559814453, 0.007841348648071289, 0.008319854736328125, 0.008798360824584961, 0.009276866912841797, 0.009755373001098633, 0.010233879089355469, 0.010712385177612305, 0.01119089126586914, 0.011669397354125977, 0.012147903442382812, 0.012626409530639648, 0.013104915618896484, 0.01358342170715332, 0.014061927795410156, 0.014540433883666992, 0.015018939971923828, 0.015497446060180664, 0.0159759521484375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 9.0, 14.0, 22.0, 69.0, 151.0, 250.0, 257.0, 131.0, 45.0, 32.0, 8.0, 5.0, 5.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10587139427661896, -0.10149287432432175, -0.09711436182260513, -0.09273584187030792, -0.08835732936859131, -0.0839788094162941, -0.07960028946399689, -0.07522177696228027, -0.07084325700998306, -0.06646473705768585, -0.06208622455596924, -0.05770770460367203, -0.053329188376665115, -0.0489506721496582, -0.04457215219736099, -0.04019363597035408, -0.03581511974334717, -0.031436603516340256, -0.027058085426688194, -0.022679567337036133, -0.01830105111002922, -0.013922534883022308, -0.009544016793370247, -0.005165498703718185, -0.0007869824767112732, 0.0035915346816182137, 0.0079700518399477, 0.012348568998277187, 0.016727086156606674, 0.021105602383613586, 0.025484120473265648, 0.02986263856291771, 0.03424115478992462, 0.038619671016931534, 0.042998187243938446, 0.04737670719623566, 0.05175522342324257, 0.05613373965024948, 0.06051225960254669, 0.0648907721042633, 0.06926929205656052, 0.07364781200885773, 0.07802632451057434, 0.08240484446287155, 0.08678336441516876, 0.09116187691688538, 0.09554039686918259, 0.0999189168214798, 0.10429742932319641, 0.10867594927549362, 0.11305446177721024, 0.11743298172950745, 0.12181149423122406, 0.12619000673294067, 0.13056853413581848, 0.1349470466375351, 0.1393255591392517, 0.14370407164096832, 0.14808259904384613, 0.15246111154556274, 0.15683962404727936, 0.16121813654899597, 0.16559666395187378, 0.1699751764535904, 0.1743537038564682]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0, 7.0, 4.0, 7.0, 9.0, 7.0, 6.0, 18.0, 8.0, 21.0, 14.0, 22.0, 21.0, 18.0, 27.0, 34.0, 41.0, 32.0, 38.0, 40.0, 46.0, 39.0, 36.0, 41.0, 37.0, 45.0, 40.0, 39.0, 33.0, 41.0, 36.0, 19.0, 32.0, 29.0, 18.0, 14.0, 13.0, 13.0, 19.0, 16.0, 6.0, 5.0, 3.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.03565680980682373, -0.03460201621055603, -0.03354722261428833, -0.03249242529273033, -0.03143763169646263, -0.03038283810019493, -0.02932804264128208, -0.028273247182369232, -0.027218453586101532, -0.026163659989833832, -0.025108864530920982, -0.024054069072008133, -0.022999275475740433, -0.021944481879472733, -0.020889686420559883, -0.019834890961647034, -0.018780097365379333, -0.017725303769111633, -0.016670508310198784, -0.015615713782608509, -0.014560919255018234, -0.01350612472742796, -0.012451330199837685, -0.01139653567224741, -0.010341741144657135, -0.00928694661706686, -0.008232152089476585, -0.007177357561886311, -0.006122563034296036, -0.005067768506705761, -0.004012973979115486, -0.0029581794515252113, -0.0019033849239349365, -0.0008485903963446617, 0.0002062041312456131, 0.001260998658835888, 0.0023157931864261627, 0.0033705877140164375, 0.004425382241606712, 0.005480176769196987, 0.006534971296787262, 0.007589765824377537, 0.008644560351967812, 0.009699354879558086, 0.010754149407148361, 0.011808943934738636, 0.01286373846232891, 0.013918532989919186, 0.01497332751750946, 0.01602812111377716, 0.01708291657269001, 0.01813771203160286, 0.01919250562787056, 0.02024729922413826, 0.02130209468305111, 0.02235689014196396, 0.02341168373823166, 0.02446647733449936, 0.02552127279341221, 0.026576068252325058, 0.027630861848592758, 0.02868565544486046, 0.029740450903773308, 0.030795246362686157, 0.03185003995895386]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 4.0, 7.0, 3.0, 10.0, 4.0, 10.0, 7.0, 12.0, 28.0, 29.0, 40.0, 52.0, 66.0, 111.0, 162.0, 293.0, 530.0, 991.0, 2641.0, 9725.0, 54632.0, 375320.0, 500177.0, 83846.0, 13743.0, 3381.0, 1198.0, 573.0, 308.0, 221.0, 136.0, 76.0, 56.0, 36.0, 36.0, 25.0, 21.0, 15.0, 10.0, 8.0, 7.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02374267578125, -0.02283334732055664, -0.02192401885986328, -0.021014690399169922, -0.020105361938476562, -0.019196033477783203, -0.018286705017089844, -0.017377376556396484, -0.016468048095703125, -0.015558719635009766, -0.014649391174316406, -0.013740062713623047, -0.012830734252929688, -0.011921405792236328, -0.011012077331542969, -0.01010274887084961, -0.00919342041015625, -0.00828409194946289, -0.007374763488769531, -0.006465435028076172, -0.0055561065673828125, -0.004646778106689453, -0.0037374496459960938, -0.0028281211853027344, -0.001918792724609375, -0.0010094642639160156, -0.00010013580322265625, 0.0008091926574707031, 0.0017185211181640625, 0.002627849578857422, 0.0035371780395507812, 0.004446506500244141, 0.0053558349609375, 0.006265163421630859, 0.007174491882324219, 0.008083820343017578, 0.008993148803710938, 0.009902477264404297, 0.010811805725097656, 0.011721134185791016, 0.012630462646484375, 0.013539791107177734, 0.014449119567871094, 0.015358448028564453, 0.016267776489257812, 0.017177104949951172, 0.01808643341064453, 0.01899576187133789, 0.01990509033203125, 0.02081441879272461, 0.02172374725341797, 0.022633075714111328, 0.023542404174804688, 0.024451732635498047, 0.025361061096191406, 0.026270389556884766, 0.027179718017578125, 0.028089046478271484, 0.028998374938964844, 0.029907703399658203, 0.030817031860351562, 0.03172636032104492, 0.03263568878173828, 0.03354501724243164, 0.034454345703125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 13.0, 33.0, 53.0, 110.0, 139.0, 151.0, 147.0, 144.0, 105.0, 61.0, 23.0, 11.0, 10.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0221099853515625, -0.02155780792236328, -0.021005630493164062, -0.020453453063964844, -0.019901275634765625, -0.019349098205566406, -0.018796920776367188, -0.01824474334716797, -0.01769256591796875, -0.01714038848876953, -0.016588211059570312, -0.016036033630371094, -0.015483856201171875, -0.014931678771972656, -0.014379501342773438, -0.013827323913574219, -0.013275146484375, -0.012722969055175781, -0.012170791625976562, -0.011618614196777344, -0.011066436767578125, -0.010514259338378906, -0.009962081909179688, -0.009409904479980469, -0.00885772705078125, -0.008305549621582031, -0.0077533721923828125, -0.007201194763183594, -0.006649017333984375, -0.006096839904785156, -0.0055446624755859375, -0.004992485046386719, -0.0044403076171875, -0.0038881301879882812, -0.0033359527587890625, -0.0027837753295898438, -0.002231597900390625, -0.0016794204711914062, -0.0011272430419921875, -0.0005750656127929688, -2.288818359375e-05, 0.0005292892456054688, 0.0010814666748046875, 0.0016336441040039062, 0.002185821533203125, 0.0027379989624023438, 0.0032901763916015625, 0.0038423538208007812, 0.00439453125, 0.004946708679199219, 0.0054988861083984375, 0.006051063537597656, 0.006603240966796875, 0.007155418395996094, 0.0077075958251953125, 0.008259773254394531, 0.00881195068359375, 0.009364128112792969, 0.009916305541992188, 0.010468482971191406, 0.011020660400390625, 0.011572837829589844, 0.012125015258789062, 0.012677192687988281, 0.0132293701171875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 7.0, 7.0, 4.0, 12.0, 14.0, 24.0, 42.0, 48.0, 66.0, 91.0, 131.0, 195.0, 344.0, 520.0, 848.0, 1718.0, 3285.0, 7414.0, 18236.0, 51282.0, 170387.0, 431251.0, 246285.0, 72932.0, 24760.0, 9602.0, 4262.0, 2046.0, 1008.0, 586.0, 373.0, 251.0, 181.0, 87.0, 78.0, 55.0, 29.0, 17.0, 13.0, 9.0, 12.0, 11.0, 13.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0179443359375, -0.0173947811126709, -0.016845226287841797, -0.016295671463012695, -0.015746116638183594, -0.015196561813354492, -0.01464700698852539, -0.014097452163696289, -0.013547897338867188, -0.012998342514038086, -0.012448787689208984, -0.011899232864379883, -0.011349678039550781, -0.01080012321472168, -0.010250568389892578, -0.009701013565063477, -0.009151458740234375, -0.008601903915405273, -0.008052349090576172, -0.00750279426574707, -0.006953239440917969, -0.006403684616088867, -0.005854129791259766, -0.005304574966430664, -0.0047550201416015625, -0.004205465316772461, -0.0036559104919433594, -0.003106355667114258, -0.0025568008422851562, -0.0020072460174560547, -0.0014576911926269531, -0.0009081363677978516, -0.00035858154296875, 0.00019097328186035156, 0.0007405281066894531, 0.0012900829315185547, 0.0018396377563476562, 0.002389192581176758, 0.0029387474060058594, 0.003488302230834961, 0.0040378570556640625, 0.004587411880493164, 0.005136966705322266, 0.005686521530151367, 0.006236076354980469, 0.00678563117980957, 0.007335186004638672, 0.007884740829467773, 0.008434295654296875, 0.008983850479125977, 0.009533405303955078, 0.01008296012878418, 0.010632514953613281, 0.011182069778442383, 0.011731624603271484, 0.012281179428100586, 0.012830734252929688, 0.013380289077758789, 0.01392984390258789, 0.014479398727416992, 0.015028953552246094, 0.015578508377075195, 0.016128063201904297, 0.0166776180267334, 0.0172271728515625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 7.0, 5.0, 12.0, 13.0, 14.0, 30.0, 48.0, 56.0, 64.0, 71.0, 68.0, 81.0, 98.0, 89.0, 86.0, 56.0, 68.0, 41.0, 23.0, 20.0, 15.0, 12.0, 10.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03021240234375, -0.029241085052490234, -0.02826976776123047, -0.027298450469970703, -0.026327133178710938, -0.025355815887451172, -0.024384498596191406, -0.02341318130493164, -0.022441864013671875, -0.02147054672241211, -0.020499229431152344, -0.019527912139892578, -0.018556594848632812, -0.017585277557373047, -0.01661396026611328, -0.015642642974853516, -0.01467132568359375, -0.013700008392333984, -0.012728691101074219, -0.011757373809814453, -0.010786056518554688, -0.009814739227294922, -0.008843421936035156, -0.00787210464477539, -0.006900787353515625, -0.005929470062255859, -0.004958152770996094, -0.003986835479736328, -0.0030155181884765625, -0.002044200897216797, -0.0010728836059570312, -0.00010156631469726562, 0.0008697509765625, 0.0018410682678222656, 0.0028123855590820312, 0.003783702850341797, 0.0047550201416015625, 0.005726337432861328, 0.006697654724121094, 0.007668972015380859, 0.008640289306640625, 0.00961160659790039, 0.010582923889160156, 0.011554241180419922, 0.012525558471679688, 0.013496875762939453, 0.014468193054199219, 0.015439510345458984, 0.01641082763671875, 0.017382144927978516, 0.01835346221923828, 0.019324779510498047, 0.020296096801757812, 0.021267414093017578, 0.022238731384277344, 0.02321004867553711, 0.024181365966796875, 0.02515268325805664, 0.026124000549316406, 0.027095317840576172, 0.028066635131835938, 0.029037952423095703, 0.03000926971435547, 0.030980587005615234, 0.031951904296875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 4.0, 4.0, 5.0, 5.0, 7.0, 13.0, 20.0, 22.0, 39.0, 62.0, 108.0, 173.0, 280.0, 442.0, 709.0, 1160.0, 1963.0, 3495.0, 6092.0, 11432.0, 22989.0, 52316.0, 144482.0, 372177.0, 266680.0, 90999.0, 36181.0, 16684.0, 8543.0, 4740.0, 2676.0, 1595.0, 944.0, 576.0, 351.0, 223.0, 145.0, 79.0, 45.0, 32.0, 30.0, 16.0, 9.0, 7.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.006053924560546875, -0.005879878997802734, -0.005705833435058594, -0.005531787872314453, -0.0053577423095703125, -0.005183696746826172, -0.005009651184082031, -0.004835605621337891, -0.00466156005859375, -0.004487514495849609, -0.004313468933105469, -0.004139423370361328, -0.0039653778076171875, -0.003791332244873047, -0.0036172866821289062, -0.0034432411193847656, -0.003269195556640625, -0.0030951499938964844, -0.0029211044311523438, -0.002747058868408203, -0.0025730133056640625, -0.002398967742919922, -0.0022249221801757812, -0.0020508766174316406, -0.0018768310546875, -0.0017027854919433594, -0.0015287399291992188, -0.0013546943664550781, -0.0011806488037109375, -0.0010066032409667969, -0.0008325576782226562, -0.0006585121154785156, -0.000484466552734375, -0.0003104209899902344, -0.00013637542724609375, 3.7670135498046875e-05, 0.0002117156982421875, 0.0003857612609863281, 0.0005598068237304688, 0.0007338523864746094, 0.00090789794921875, 0.0010819435119628906, 0.0012559890747070312, 0.0014300346374511719, 0.0016040802001953125, 0.0017781257629394531, 0.0019521713256835938, 0.0021262168884277344, 0.002300262451171875, 0.0024743080139160156, 0.0026483535766601562, 0.002822399139404297, 0.0029964447021484375, 0.003170490264892578, 0.0033445358276367188, 0.0035185813903808594, 0.003692626953125, 0.0038666725158691406, 0.004040718078613281, 0.004214763641357422, 0.0043888092041015625, 0.004562854766845703, 0.004736900329589844, 0.004910945892333984, 0.005084991455078125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 2.0, 4.0, 8.0, 3.0, 5.0, 15.0, 10.0, 15.0, 23.0, 24.0, 30.0, 38.0, 34.0, 54.0, 71.0, 68.0, 77.0, 84.0, 67.0, 73.0, 58.0, 44.0, 35.0, 34.0, 27.0, 20.0, 14.0, 11.0, 13.0, 15.0, 7.0, 5.0, 3.0, 2.0, 6.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.2961368560791016e-05, -3.175530582666397e-05, -3.0549243092536926e-05, -2.934318035840988e-05, -2.8137117624282837e-05, -2.6931054890155792e-05, -2.5724992156028748e-05, -2.4518929421901703e-05, -2.3312866687774658e-05, -2.2106803953647614e-05, -2.090074121952057e-05, -1.9694678485393524e-05, -1.848861575126648e-05, -1.7282553017139435e-05, -1.607649028301239e-05, -1.4870427548885345e-05, -1.36643648147583e-05, -1.2458302080631256e-05, -1.1252239346504211e-05, -1.0046176612377167e-05, -8.840113878250122e-06, -7.634051144123077e-06, -6.427988409996033e-06, -5.221925675868988e-06, -4.015862941741943e-06, -2.8098002076148987e-06, -1.603737473487854e-06, -3.976747393608093e-07, 8.083879947662354e-07, 2.01445072889328e-06, 3.2205134630203247e-06, 4.426576197147369e-06, 5.632638931274414e-06, 6.838701665401459e-06, 8.044764399528503e-06, 9.250827133655548e-06, 1.0456889867782593e-05, 1.1662952601909637e-05, 1.2869015336036682e-05, 1.4075078070163727e-05, 1.528114080429077e-05, 1.6487203538417816e-05, 1.769326627254486e-05, 1.8899329006671906e-05, 2.010539174079895e-05, 2.1311454474925995e-05, 2.251751720905304e-05, 2.3723579943180084e-05, 2.492964267730713e-05, 2.6135705411434174e-05, 2.7341768145561218e-05, 2.8547830879688263e-05, 2.9753893613815308e-05, 3.095995634794235e-05, 3.21660190820694e-05, 3.337208181619644e-05, 3.4578144550323486e-05, 3.578420728445053e-05, 3.6990270018577576e-05, 3.819633275270462e-05, 3.9402395486831665e-05, 4.060845822095871e-05, 4.1814520955085754e-05, 4.30205836892128e-05, 4.4226646423339844e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 8.0, 18.0, 26.0, 33.0, 49.0, 77.0, 148.0, 247.0, 407.0, 767.0, 1411.0, 2721.0, 5821.0, 13166.0, 38560.0, 163940.0, 543724.0, 204509.0, 45226.0, 14901.0, 6270.0, 3000.0, 1531.0, 882.0, 452.0, 295.0, 154.0, 77.0, 50.0, 33.0, 19.0, 8.0, 5.0, 3.0, 6.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.008148193359375, -0.00789797306060791, -0.00764775276184082, -0.0073975324630737305, -0.007147312164306641, -0.006897091865539551, -0.006646871566772461, -0.006396651268005371, -0.006146430969238281, -0.005896210670471191, -0.0056459903717041016, -0.005395770072937012, -0.005145549774169922, -0.004895329475402832, -0.004645109176635742, -0.004394888877868652, -0.0041446685791015625, -0.0038944482803344727, -0.003644227981567383, -0.003394007682800293, -0.003143787384033203, -0.0028935670852661133, -0.0026433467864990234, -0.0023931264877319336, -0.0021429061889648438, -0.001892685890197754, -0.001642465591430664, -0.0013922452926635742, -0.0011420249938964844, -0.0008918046951293945, -0.0006415843963623047, -0.00039136409759521484, -0.000141143798828125, 0.00010907649993896484, 0.0003592967987060547, 0.0006095170974731445, 0.0008597373962402344, 0.0011099576950073242, 0.001360177993774414, 0.001610398292541504, 0.0018606185913085938, 0.0021108388900756836, 0.0023610591888427734, 0.0026112794876098633, 0.002861499786376953, 0.003111720085144043, 0.003361940383911133, 0.0036121606826782227, 0.0038623809814453125, 0.004112601280212402, 0.004362821578979492, 0.004613041877746582, 0.004863262176513672, 0.005113482475280762, 0.0053637027740478516, 0.005613923072814941, 0.005864143371582031, 0.006114363670349121, 0.006364583969116211, 0.006614804267883301, 0.006865024566650391, 0.0071152448654174805, 0.00736546516418457, 0.00761568546295166, 0.00786590576171875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 8.0, 12.0, 11.0, 17.0, 16.0, 22.0, 34.0, 61.0, 64.0, 72.0, 76.0, 82.0, 99.0, 97.0, 84.0, 50.0, 50.0, 28.0, 22.0, 23.0, 15.0, 10.0, 9.0, 3.0, 5.0, 5.0, 2.0, 5.0, 2.0, 6.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00823974609375, -0.007995188236236572, -0.0077506303787231445, -0.007506072521209717, -0.007261514663696289, -0.007016956806182861, -0.006772398948669434, -0.006527841091156006, -0.006283283233642578, -0.00603872537612915, -0.005794167518615723, -0.005549609661102295, -0.005305051803588867, -0.0050604939460754395, -0.004815936088562012, -0.004571378231048584, -0.004326820373535156, -0.0040822625160217285, -0.0038377046585083008, -0.003593146800994873, -0.0033485889434814453, -0.0031040310859680176, -0.00285947322845459, -0.002614915370941162, -0.0023703575134277344, -0.0021257996559143066, -0.001881241798400879, -0.0016366839408874512, -0.0013921260833740234, -0.0011475682258605957, -0.000903010368347168, -0.0006584525108337402, -0.0004138946533203125, -0.00016933679580688477, 7.522106170654297e-05, 0.0003197789192199707, 0.0005643367767333984, 0.0008088946342468262, 0.001053452491760254, 0.0012980103492736816, 0.0015425682067871094, 0.0017871260643005371, 0.002031683921813965, 0.0022762417793273926, 0.0025207996368408203, 0.002765357494354248, 0.0030099153518676758, 0.0032544732093811035, 0.0034990310668945312, 0.003743588924407959, 0.003988146781921387, 0.0042327046394348145, 0.004477262496948242, 0.00472182035446167, 0.004966378211975098, 0.005210936069488525, 0.005455493927001953, 0.005700051784515381, 0.005944609642028809, 0.006189167499542236, 0.006433725357055664, 0.006678283214569092, 0.0069228410720825195, 0.007167398929595947, 0.007411956787109375]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 3.0, 8.0, 7.0, 10.0, 16.0, 34.0, 75.0, 110.0, 180.0, 212.0, 188.0, 74.0, 40.0, 18.0, 9.0, 9.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2480146288871765, -0.24268707633018494, -0.23735950887203217, -0.2320319563150406, -0.22670438885688782, -0.22137683629989624, -0.21604926884174347, -0.2107217162847519, -0.20539414882659912, -0.20006659626960754, -0.19473902881145477, -0.1894114762544632, -0.18408390879631042, -0.17875635623931885, -0.17342878878116608, -0.1681012362241745, -0.16277366876602173, -0.15744611620903015, -0.15211854875087738, -0.1467909961938858, -0.14146342873573303, -0.13613587617874146, -0.13080830872058868, -0.1254807561635971, -0.12015320360660553, -0.11482564359903336, -0.10949808359146118, -0.10417052358388901, -0.09884296357631683, -0.09351540356874466, -0.08818784356117249, -0.08286029100418091, -0.07753272354602814, -0.07220516353845596, -0.06687760353088379, -0.061550043523311615, -0.05622248351573944, -0.05089492350816727, -0.04556736722588539, -0.04023980721831322, -0.03491224721074104, -0.02958468720316887, -0.024257127195596695, -0.01892956905066967, -0.013602009043097496, -0.008274449035525322, -0.002946890890598297, 0.002380669116973877, 0.007708229124546051, 0.013035789132118225, 0.0183633491396904, 0.023690907284617424, 0.029018467292189598, 0.03434602916240692, 0.0396735854446888, 0.04500114545226097, 0.050328705459833145, 0.05565626546740532, 0.06098382547497749, 0.06631138175725937, 0.07163894176483154, 0.07696650177240372, 0.08229406177997589, 0.08762162178754807, 0.09294918179512024]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 12.0, 6.0, 12.0, 15.0, 15.0, 13.0, 22.0, 19.0, 29.0, 28.0, 29.0, 28.0, 40.0, 45.0, 36.0, 30.0, 39.0, 53.0, 56.0, 41.0, 41.0, 34.0, 35.0, 31.0, 31.0, 33.0, 36.0, 34.0, 29.0, 19.0, 15.0, 12.0, 16.0, 10.0, 15.0, 8.0, 6.0, 8.0, 5.0, 1.0, 2.0, 6.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04658132791519165, -0.04511958360671997, -0.04365783557295799, -0.042196087539196014, -0.040734343230724335, -0.039272598922252655, -0.03781085088849068, -0.0363491028547287, -0.03488735854625702, -0.03342561423778534, -0.03196386620402336, -0.030502120032906532, -0.029040373861789703, -0.027578627690672874, -0.026116881519556046, -0.024655135348439217, -0.023193389177322388, -0.02173164300620556, -0.02026989683508873, -0.0188081506639719, -0.017346404492855072, -0.015884658321738243, -0.014422912150621414, -0.012961165979504585, -0.011499419808387756, -0.010037673637270927, -0.008575927466154099, -0.00711418129503727, -0.005652435123920441, -0.004190688952803612, -0.002728942781686783, -0.001267196610569954, 0.000194549560546875, 0.001656295731663704, 0.003118041902780533, 0.004579788073897362, 0.006041534245014191, 0.00750328041613102, 0.008965026587247849, 0.010426772758364677, 0.011888518929481506, 0.013350265100598335, 0.014812011271715164, 0.016273757442831993, 0.017735503613948822, 0.01919724978506565, 0.02065899595618248, 0.02212074212729931, 0.023582488298416138, 0.025044234469532967, 0.026505980640649796, 0.027967726811766624, 0.029429472982883453, 0.030891219154000282, 0.03235296532511711, 0.03381471335887909, 0.03527645766735077, 0.03673820197582245, 0.03819995000958443, 0.039661698043346405, 0.041123442351818085, 0.042585186660289764, 0.04404693469405174, 0.04550868272781372, 0.0469704270362854]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 6.0, 6.0, 7.0, 8.0, 13.0, 10.0, 12.0, 14.0, 25.0, 37.0, 63.0, 85.0, 191.0, 369.0, 1077.0, 3793.0, 21385.0, 364336.0, 3692653.0, 93191.0, 12401.0, 3165.0, 865.0, 279.0, 99.0, 79.0, 37.0, 27.0, 17.0, 10.0, 8.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03387451171875, -0.03296685218811035, -0.0320591926574707, -0.031151533126831055, -0.030243873596191406, -0.029336214065551758, -0.02842855453491211, -0.02752089500427246, -0.026613235473632812, -0.025705575942993164, -0.024797916412353516, -0.023890256881713867, -0.02298259735107422, -0.02207493782043457, -0.021167278289794922, -0.020259618759155273, -0.019351959228515625, -0.018444299697875977, -0.017536640167236328, -0.01662898063659668, -0.01572132110595703, -0.014813661575317383, -0.013906002044677734, -0.012998342514038086, -0.012090682983398438, -0.011183023452758789, -0.01027536392211914, -0.009367704391479492, -0.008460044860839844, -0.007552385330200195, -0.006644725799560547, -0.0057370662689208984, -0.00482940673828125, -0.0039217472076416016, -0.003014087677001953, -0.0021064281463623047, -0.0011987686157226562, -0.0002911090850830078, 0.0006165504455566406, 0.001524209976196289, 0.0024318695068359375, 0.003339529037475586, 0.004247188568115234, 0.005154848098754883, 0.006062507629394531, 0.00697016716003418, 0.007877826690673828, 0.008785486221313477, 0.009693145751953125, 0.010600805282592773, 0.011508464813232422, 0.01241612434387207, 0.013323783874511719, 0.014231443405151367, 0.015139102935791016, 0.016046762466430664, 0.016954421997070312, 0.01786208152770996, 0.01876974105834961, 0.019677400588989258, 0.020585060119628906, 0.021492719650268555, 0.022400379180908203, 0.02330803871154785, 0.0242156982421875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 8.0, 21.0, 28.0, 37.0, 75.0, 127.0, 139.0, 156.0, 159.0, 96.0, 77.0, 48.0, 24.0, 6.0, 6.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02374267578125, -0.023182988166809082, -0.022623300552368164, -0.022063612937927246, -0.021503925323486328, -0.02094423770904541, -0.020384550094604492, -0.019824862480163574, -0.019265174865722656, -0.01870548725128174, -0.01814579963684082, -0.017586112022399902, -0.017026424407958984, -0.016466736793518066, -0.01590704917907715, -0.01534736156463623, -0.014787673950195312, -0.014227986335754395, -0.013668298721313477, -0.013108611106872559, -0.01254892349243164, -0.011989235877990723, -0.011429548263549805, -0.010869860649108887, -0.010310173034667969, -0.00975048542022705, -0.009190797805786133, -0.008631110191345215, -0.008071422576904297, -0.007511734962463379, -0.006952047348022461, -0.006392359733581543, -0.005832672119140625, -0.005272984504699707, -0.004713296890258789, -0.004153609275817871, -0.003593921661376953, -0.003034234046936035, -0.002474546432495117, -0.0019148588180541992, -0.0013551712036132812, -0.0007954835891723633, -0.0002357959747314453, 0.00032389163970947266, 0.0008835792541503906, 0.0014432668685913086, 0.0020029544830322266, 0.0025626420974731445, 0.0031223297119140625, 0.0036820173263549805, 0.0042417049407958984, 0.004801392555236816, 0.005361080169677734, 0.005920767784118652, 0.00648045539855957, 0.007040143013000488, 0.007599830627441406, 0.008159518241882324, 0.008719205856323242, 0.00927889347076416, 0.009838581085205078, 0.010398268699645996, 0.010957956314086914, 0.011517643928527832, 0.01207733154296875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 5.0, 17.0, 24.0, 37.0, 54.0, 75.0, 106.0, 216.0, 262.0, 503.0, 886.0, 1802.0, 3856.0, 8869.0, 24293.0, 91653.0, 1008474.0, 2847990.0, 150743.0, 33511.0, 11384.0, 4752.0, 2203.0, 1114.0, 586.0, 341.0, 175.0, 122.0, 68.0, 39.0, 34.0, 32.0, 10.0, 17.0, 10.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0186767578125, -0.018145322799682617, -0.017613887786865234, -0.01708245277404785, -0.01655101776123047, -0.016019582748413086, -0.015488147735595703, -0.01495671272277832, -0.014425277709960938, -0.013893842697143555, -0.013362407684326172, -0.012830972671508789, -0.012299537658691406, -0.011768102645874023, -0.01123666763305664, -0.010705232620239258, -0.010173797607421875, -0.009642362594604492, -0.00911092758178711, -0.008579492568969727, -0.008048057556152344, -0.007516622543334961, -0.006985187530517578, -0.006453752517700195, -0.0059223175048828125, -0.00539088249206543, -0.004859447479248047, -0.004328012466430664, -0.0037965774536132812, -0.0032651424407958984, -0.0027337074279785156, -0.002202272415161133, -0.00167083740234375, -0.0011394023895263672, -0.0006079673767089844, -7.653236389160156e-05, 0.00045490264892578125, 0.000986337661743164, 0.0015177726745605469, 0.0020492076873779297, 0.0025806427001953125, 0.0031120777130126953, 0.003643512725830078, 0.004174947738647461, 0.004706382751464844, 0.0052378177642822266, 0.005769252777099609, 0.006300687789916992, 0.006832122802734375, 0.007363557815551758, 0.00789499282836914, 0.008426427841186523, 0.008957862854003906, 0.009489297866821289, 0.010020732879638672, 0.010552167892456055, 0.011083602905273438, 0.01161503791809082, 0.012146472930908203, 0.012677907943725586, 0.013209342956542969, 0.013740777969360352, 0.014272212982177734, 0.014803647994995117, 0.0153350830078125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 4.0, 7.0, 13.0, 23.0, 28.0, 48.0, 89.0, 150.0, 395.0, 1193.0, 1218.0, 453.0, 170.0, 92.0, 54.0, 42.0, 25.0, 15.0, 14.0, 6.0, 7.0, 9.0, 4.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0260772705078125, -0.025390148162841797, -0.024703025817871094, -0.02401590347290039, -0.023328781127929688, -0.022641658782958984, -0.02195453643798828, -0.021267414093017578, -0.020580291748046875, -0.019893169403076172, -0.01920604705810547, -0.018518924713134766, -0.017831802368164062, -0.01714468002319336, -0.016457557678222656, -0.015770435333251953, -0.01508331298828125, -0.014396190643310547, -0.013709068298339844, -0.01302194595336914, -0.012334823608398438, -0.011647701263427734, -0.010960578918457031, -0.010273456573486328, -0.009586334228515625, -0.008899211883544922, -0.008212089538574219, -0.007524967193603516, -0.0068378448486328125, -0.006150722503662109, -0.005463600158691406, -0.004776477813720703, -0.00408935546875, -0.003402233123779297, -0.0027151107788085938, -0.0020279884338378906, -0.0013408660888671875, -0.0006537437438964844, 3.337860107421875e-05, 0.0007205009460449219, 0.001407623291015625, 0.002094745635986328, 0.0027818679809570312, 0.0034689903259277344, 0.0041561126708984375, 0.004843235015869141, 0.005530357360839844, 0.006217479705810547, 0.00690460205078125, 0.007591724395751953, 0.008278846740722656, 0.00896596908569336, 0.009653091430664062, 0.010340213775634766, 0.011027336120605469, 0.011714458465576172, 0.012401580810546875, 0.013088703155517578, 0.013775825500488281, 0.014462947845458984, 0.015150070190429688, 0.01583719253540039, 0.016524314880371094, 0.017211437225341797, 0.0178985595703125]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 7.0, 18.0, 32.0, 66.0, 155.0, 253.0, 208.0, 123.0, 71.0, 32.0, 15.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.17267051339149475, -0.16688667237758636, -0.16110284626483917, -0.1553190052509308, -0.1495351791381836, -0.1437513381242752, -0.13796749711036682, -0.13218367099761963, -0.12639982998371124, -0.12061599642038345, -0.11483216285705566, -0.10904832184314728, -0.10326448827981949, -0.0974806547164917, -0.09169682115316391, -0.08591298758983612, -0.08012915402650833, -0.07434532046318054, -0.06856148689985275, -0.06277765333652496, -0.05699381232261658, -0.05120997875928879, -0.045426145195961, -0.03964230790734291, -0.03385847434401512, -0.028074638918042183, -0.022290803492069244, -0.016506969928741455, -0.010723134502768517, -0.004939299076795578, 0.0008445344865322113, 0.006628371775150299, 0.012412205338478088, 0.018196040764451027, 0.023979876190423965, 0.029763709753751755, 0.03554754704236984, 0.04133138060569763, 0.04711521416902542, 0.05289905145764351, 0.0586828850209713, 0.06446672230958939, 0.07025055587291718, 0.07603438943624496, 0.08181822299957275, 0.08760206401348114, 0.09338589012622833, 0.09916973114013672, 0.10495356470346451, 0.1107373982667923, 0.11652123183012009, 0.12230506539344788, 0.12808890640735626, 0.13387274742126465, 0.13965657353401184, 0.14544041454792023, 0.15122424066066742, 0.1570080816745758, 0.162791907787323, 0.16857574880123138, 0.17435957491397858, 0.18014341592788696, 0.18592724204063416, 0.19171108305454254, 0.19749492406845093]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 2.0, 4.0, 7.0, 7.0, 12.0, 6.0, 7.0, 14.0, 16.0, 17.0, 14.0, 21.0, 23.0, 33.0, 26.0, 30.0, 36.0, 39.0, 36.0, 47.0, 52.0, 34.0, 46.0, 42.0, 38.0, 42.0, 37.0, 29.0, 26.0, 39.0, 26.0, 19.0, 23.0, 31.0, 21.0, 21.0, 17.0, 7.0, 15.0, 5.0, 3.0, 5.0, 8.0, 2.0, 7.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.048924267292022705, -0.04735838621854782, -0.04579250514507294, -0.044226620346307755, -0.04266073927283287, -0.041094858199357986, -0.039528973400592804, -0.03796309232711792, -0.036397211253643036, -0.03483133018016815, -0.03326544910669327, -0.031699564307928085, -0.0301336832344532, -0.028567802160978317, -0.027001919224858284, -0.02543603628873825, -0.023870155215263367, -0.022304274141788483, -0.02073839120566845, -0.019172508269548416, -0.017606627196073532, -0.016040746122598648, -0.014474863186478615, -0.012908981181681156, -0.011343099176883698, -0.009777217172086239, -0.00821133516728878, -0.0066454531624913216, -0.005079571157693863, -0.0035136891528964043, -0.0019478071480989456, -0.00038192514330148697, 0.0011839568614959717, 0.0027498388662934303, 0.004315720871090889, 0.005881602875888348, 0.007447484880685806, 0.009013366885483265, 0.010579248890280724, 0.012145130895078182, 0.013711012899875641, 0.0152768949046731, 0.016842776909470558, 0.01840865984559059, 0.019974540919065475, 0.02154042199254036, 0.023106304928660393, 0.024672187864780426, 0.02623806893825531, 0.027803950011730194, 0.029369832947850227, 0.03093571588397026, 0.032501596957445145, 0.03406747803092003, 0.03563336282968521, 0.037199243903160095, 0.03876512497663498, 0.04033100605010986, 0.04189688712358475, 0.04346277192234993, 0.045028652995824814, 0.0465945340692997, 0.04816041886806488, 0.049726299941539764, 0.05129218101501465]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 11.0, 9.0, 12.0, 16.0, 21.0, 27.0, 44.0, 50.0, 89.0, 105.0, 173.0, 263.0, 463.0, 1054.0, 2864.0, 9936.0, 44599.0, 234186.0, 542738.0, 167319.0, 32586.0, 7609.0, 2238.0, 881.0, 443.0, 250.0, 179.0, 109.0, 61.0, 65.0, 36.0, 27.0, 28.0, 13.0, 11.0, 8.0, 3.0, 2.0, 10.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.0291290283203125, -0.028256893157958984, -0.02738475799560547, -0.026512622833251953, -0.025640487670898438, -0.024768352508544922, -0.023896217346191406, -0.02302408218383789, -0.022151947021484375, -0.02127981185913086, -0.020407676696777344, -0.019535541534423828, -0.018663406372070312, -0.017791271209716797, -0.01691913604736328, -0.016047000885009766, -0.01517486572265625, -0.014302730560302734, -0.013430595397949219, -0.012558460235595703, -0.011686325073242188, -0.010814189910888672, -0.009942054748535156, -0.00906991958618164, -0.008197784423828125, -0.007325649261474609, -0.006453514099121094, -0.005581378936767578, -0.0047092437744140625, -0.003837108612060547, -0.0029649734497070312, -0.0020928382873535156, -0.001220703125, -0.0003485679626464844, 0.0005235671997070312, 0.0013957023620605469, 0.0022678375244140625, 0.003139972686767578, 0.004012107849121094, 0.004884243011474609, 0.005756378173828125, 0.006628513336181641, 0.007500648498535156, 0.008372783660888672, 0.009244918823242188, 0.010117053985595703, 0.010989189147949219, 0.011861324310302734, 0.01273345947265625, 0.013605594635009766, 0.014477729797363281, 0.015349864959716797, 0.016222000122070312, 0.017094135284423828, 0.017966270446777344, 0.01883840560913086, 0.019710540771484375, 0.02058267593383789, 0.021454811096191406, 0.022326946258544922, 0.023199081420898438, 0.024071216583251953, 0.02494335174560547, 0.025815486907958984, 0.0266876220703125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 8.0, 17.0, 34.0, 43.0, 58.0, 103.0, 113.0, 127.0, 130.0, 121.0, 90.0, 75.0, 42.0, 23.0, 12.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022430419921875, -0.021882176399230957, -0.021333932876586914, -0.02078568935394287, -0.020237445831298828, -0.019689202308654785, -0.019140958786010742, -0.0185927152633667, -0.018044471740722656, -0.017496228218078613, -0.01694798469543457, -0.016399741172790527, -0.015851497650146484, -0.015303254127502441, -0.014755010604858398, -0.014206767082214355, -0.013658523559570312, -0.01311028003692627, -0.012562036514282227, -0.012013792991638184, -0.01146554946899414, -0.010917305946350098, -0.010369062423706055, -0.009820818901062012, -0.009272575378417969, -0.008724331855773926, -0.008176088333129883, -0.00762784481048584, -0.007079601287841797, -0.006531357765197754, -0.005983114242553711, -0.005434870719909668, -0.004886627197265625, -0.004338383674621582, -0.003790140151977539, -0.003241896629333496, -0.002693653106689453, -0.00214540958404541, -0.0015971660614013672, -0.0010489225387573242, -0.0005006790161132812, 4.756450653076172e-05, 0.0005958080291748047, 0.0011440515518188477, 0.0016922950744628906, 0.0022405385971069336, 0.0027887821197509766, 0.0033370256423950195, 0.0038852691650390625, 0.0044335126876831055, 0.0049817562103271484, 0.005529999732971191, 0.006078243255615234, 0.006626486778259277, 0.00717473030090332, 0.007722973823547363, 0.008271217346191406, 0.00881946086883545, 0.009367704391479492, 0.009915947914123535, 0.010464191436767578, 0.011012434959411621, 0.011560678482055664, 0.012108922004699707, 0.01265716552734375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 4.0, 7.0, 6.0, 16.0, 18.0, 28.0, 36.0, 54.0, 65.0, 119.0, 141.0, 222.0, 367.0, 569.0, 849.0, 1292.0, 2121.0, 3387.0, 5797.0, 9911.0, 18509.0, 35845.0, 74318.0, 165731.0, 334538.0, 207977.0, 92611.0, 43204.0, 21887.0, 11753.0, 6684.0, 3940.0, 2275.0, 1540.0, 920.0, 582.0, 392.0, 263.0, 185.0, 116.0, 83.0, 64.0, 37.0, 29.0, 19.0, 13.0, 21.0, 6.0, 6.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.0136566162109375, -0.013224959373474121, -0.012793302536010742, -0.012361645698547363, -0.011929988861083984, -0.011498332023620605, -0.011066675186157227, -0.010635018348693848, -0.010203361511230469, -0.00977170467376709, -0.009340047836303711, -0.008908390998840332, -0.008476734161376953, -0.008045077323913574, -0.007613420486450195, -0.007181763648986816, -0.0067501068115234375, -0.006318449974060059, -0.00588679313659668, -0.005455136299133301, -0.005023479461669922, -0.004591822624206543, -0.004160165786743164, -0.003728508949279785, -0.0032968521118164062, -0.0028651952743530273, -0.0024335384368896484, -0.0020018815994262695, -0.0015702247619628906, -0.0011385679244995117, -0.0007069110870361328, -0.0002752542495727539, 0.000156402587890625, 0.0005880594253540039, 0.0010197162628173828, 0.0014513731002807617, 0.0018830299377441406, 0.0023146867752075195, 0.0027463436126708984, 0.0031780004501342773, 0.0036096572875976562, 0.004041314125061035, 0.004472970962524414, 0.004904627799987793, 0.005336284637451172, 0.005767941474914551, 0.00619959831237793, 0.006631255149841309, 0.0070629119873046875, 0.007494568824768066, 0.007926225662231445, 0.008357882499694824, 0.008789539337158203, 0.009221196174621582, 0.009652853012084961, 0.01008450984954834, 0.010516166687011719, 0.010947823524475098, 0.011379480361938477, 0.011811137199401855, 0.012242794036865234, 0.012674450874328613, 0.013106107711791992, 0.013537764549255371, 0.01396942138671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 1.0, 2.0, 3.0, 8.0, 8.0, 4.0, 12.0, 12.0, 16.0, 18.0, 21.0, 20.0, 34.0, 38.0, 41.0, 45.0, 46.0, 48.0, 69.0, 50.0, 45.0, 53.0, 51.0, 39.0, 54.0, 37.0, 33.0, 34.0, 36.0, 21.0, 16.0, 17.0, 19.0, 12.0, 9.0, 4.0, 3.0, 6.0, 6.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0211639404296875, -0.020483732223510742, -0.019803524017333984, -0.019123315811157227, -0.01844310760498047, -0.01776289939880371, -0.017082691192626953, -0.016402482986450195, -0.015722274780273438, -0.01504206657409668, -0.014361858367919922, -0.013681650161743164, -0.013001441955566406, -0.012321233749389648, -0.01164102554321289, -0.010960817337036133, -0.010280609130859375, -0.009600400924682617, -0.00892019271850586, -0.008239984512329102, -0.007559776306152344, -0.006879568099975586, -0.006199359893798828, -0.00551915168762207, -0.0048389434814453125, -0.004158735275268555, -0.003478527069091797, -0.002798318862915039, -0.0021181106567382812, -0.0014379024505615234, -0.0007576942443847656, -7.748603820800781e-05, 0.00060272216796875, 0.0012829303741455078, 0.0019631385803222656, 0.0026433467864990234, 0.0033235549926757812, 0.004003763198852539, 0.004683971405029297, 0.005364179611206055, 0.0060443878173828125, 0.00672459602355957, 0.007404804229736328, 0.008085012435913086, 0.008765220642089844, 0.009445428848266602, 0.01012563705444336, 0.010805845260620117, 0.011486053466796875, 0.012166261672973633, 0.01284646987915039, 0.013526678085327148, 0.014206886291503906, 0.014887094497680664, 0.015567302703857422, 0.01624751091003418, 0.016927719116210938, 0.017607927322387695, 0.018288135528564453, 0.01896834373474121, 0.01964855194091797, 0.020328760147094727, 0.021008968353271484, 0.021689176559448242, 0.022369384765625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 13.0, 12.0, 26.0, 36.0, 41.0, 56.0, 100.0, 133.0, 166.0, 297.0, 497.0, 762.0, 1317.0, 2175.0, 3761.0, 6708.0, 12855.0, 26267.0, 60302.0, 159073.0, 401732.0, 222429.0, 80855.0, 33872.0, 15968.0, 8208.0, 4427.0, 2457.0, 1506.0, 957.0, 592.0, 331.0, 226.0, 116.0, 73.0, 58.0, 50.0, 29.0, 22.0, 14.0, 11.0, 9.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-0.00484466552734375, -0.0046866536140441895, -0.004528641700744629, -0.004370629787445068, -0.004212617874145508, -0.004054605960845947, -0.0038965940475463867, -0.003738582134246826, -0.0035805702209472656, -0.003422558307647705, -0.0032645463943481445, -0.003106534481048584, -0.0029485225677490234, -0.002790510654449463, -0.0026324987411499023, -0.002474486827850342, -0.0023164749145507812, -0.0021584630012512207, -0.00200045108795166, -0.0018424391746520996, -0.001684427261352539, -0.0015264153480529785, -0.001368403434753418, -0.0012103915214538574, -0.0010523796081542969, -0.0008943676948547363, -0.0007363557815551758, -0.0005783438682556152, -0.0004203319549560547, -0.00026232004165649414, -0.0001043081283569336, 5.370378494262695e-05, 0.0002117156982421875, 0.00036972761154174805, 0.0005277395248413086, 0.0006857514381408691, 0.0008437633514404297, 0.0010017752647399902, 0.0011597871780395508, 0.0013177990913391113, 0.0014758110046386719, 0.0016338229179382324, 0.001791834831237793, 0.0019498467445373535, 0.002107858657836914, 0.0022658705711364746, 0.002423882484436035, 0.0025818943977355957, 0.0027399063110351562, 0.002897918224334717, 0.0030559301376342773, 0.003213942050933838, 0.0033719539642333984, 0.003529965877532959, 0.0036879777908325195, 0.00384598970413208, 0.004004001617431641, 0.004162013530731201, 0.004320025444030762, 0.004478037357330322, 0.004636049270629883, 0.004794061183929443, 0.004952073097229004, 0.0051100850105285645, 0.005268096923828125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 6.0, 3.0, 9.0, 2.0, 13.0, 8.0, 10.0, 12.0, 10.0, 21.0, 25.0, 58.0, 50.0, 80.0, 73.0, 92.0, 97.0, 77.0, 75.0, 61.0, 44.0, 35.0, 25.0, 26.0, 15.0, 13.0, 11.0, 14.0, 5.0, 8.0, 6.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.331899642944336e-05, -3.214646130800247e-05, -3.0973926186561584e-05, -2.9801391065120697e-05, -2.862885594367981e-05, -2.7456320822238922e-05, -2.6283785700798035e-05, -2.5111250579357147e-05, -2.393871545791626e-05, -2.2766180336475372e-05, -2.1593645215034485e-05, -2.0421110093593597e-05, -1.924857497215271e-05, -1.8076039850711823e-05, -1.6903504729270935e-05, -1.5730969607830048e-05, -1.455843448638916e-05, -1.3385899364948273e-05, -1.2213364243507385e-05, -1.1040829122066498e-05, -9.86829400062561e-06, -8.695758879184723e-06, -7.5232237577438354e-06, -6.350688636302948e-06, -5.1781535148620605e-06, -4.005618393421173e-06, -2.8330832719802856e-06, -1.6605481505393982e-06, -4.880130290985107e-07, 6.845220923423767e-07, 1.8570572137832642e-06, 3.0295923352241516e-06, 4.202127456665039e-06, 5.3746625781059265e-06, 6.547197699546814e-06, 7.719732820987701e-06, 8.892267942428589e-06, 1.0064803063869476e-05, 1.1237338185310364e-05, 1.2409873306751251e-05, 1.3582408428192139e-05, 1.4754943549633026e-05, 1.5927478671073914e-05, 1.71000137925148e-05, 1.827254891395569e-05, 1.9445084035396576e-05, 2.0617619156837463e-05, 2.179015427827835e-05, 2.2962689399719238e-05, 2.4135224521160126e-05, 2.5307759642601013e-05, 2.64802947640419e-05, 2.7652829885482788e-05, 2.8825365006923676e-05, 2.9997900128364563e-05, 3.117043524980545e-05, 3.234297037124634e-05, 3.3515505492687225e-05, 3.468804061412811e-05, 3.5860575735569e-05, 3.703311085700989e-05, 3.8205645978450775e-05, 3.937818109989166e-05, 4.055071622133255e-05, 4.172325134277344e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 9.0, 4.0, 8.0, 16.0, 20.0, 28.0, 45.0, 46.0, 99.0, 120.0, 216.0, 290.0, 476.0, 713.0, 1250.0, 2153.0, 3704.0, 6885.0, 13142.0, 26985.0, 57789.0, 135979.0, 332714.0, 260556.0, 109573.0, 48165.0, 22447.0, 11092.0, 5843.0, 3209.0, 1887.0, 1128.0, 645.0, 454.0, 281.0, 172.0, 123.0, 96.0, 51.0, 41.0, 31.0, 18.0, 13.0, 15.0, 8.0, 7.0, 4.0, 4.0, 0.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.004180908203125, -0.004057496786117554, -0.003934085369110107, -0.003810673952102661, -0.003687262535095215, -0.0035638511180877686, -0.0034404397010803223, -0.003317028284072876, -0.0031936168670654297, -0.0030702054500579834, -0.002946794033050537, -0.002823382616043091, -0.0026999711990356445, -0.0025765597820281982, -0.002453148365020752, -0.0023297369480133057, -0.0022063255310058594, -0.002082914113998413, -0.001959502696990967, -0.0018360912799835205, -0.0017126798629760742, -0.001589268445968628, -0.0014658570289611816, -0.0013424456119537354, -0.001219034194946289, -0.0010956227779388428, -0.0009722113609313965, -0.0008487999439239502, -0.0007253885269165039, -0.0006019771099090576, -0.00047856569290161133, -0.00035515427589416504, -0.00023174285888671875, -0.00010833144187927246, 1.5079975128173828e-05, 0.00013849139213562012, 0.0002619028091430664, 0.0003853142261505127, 0.000508725643157959, 0.0006321370601654053, 0.0007555484771728516, 0.0008789598941802979, 0.0010023713111877441, 0.0011257827281951904, 0.0012491941452026367, 0.001372605562210083, 0.0014960169792175293, 0.0016194283962249756, 0.0017428398132324219, 0.0018662512302398682, 0.0019896626472473145, 0.0021130740642547607, 0.002236485481262207, 0.0023598968982696533, 0.0024833083152770996, 0.002606719732284546, 0.002730131149291992, 0.0028535425662994385, 0.0029769539833068848, 0.003100365400314331, 0.0032237768173217773, 0.0033471882343292236, 0.00347059965133667, 0.003594011068344116, 0.0037174224853515625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 7.0, 4.0, 6.0, 13.0, 11.0, 15.0, 22.0, 22.0, 38.0, 48.0, 56.0, 69.0, 76.0, 63.0, 88.0, 88.0, 79.0, 72.0, 46.0, 35.0, 28.0, 18.0, 17.0, 19.0, 17.0, 11.0, 3.0, 3.0, 5.0, 7.0, 1.0, 9.0, 1.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.006877899169921875, -0.006689488887786865, -0.0065010786056518555, -0.006312668323516846, -0.006124258041381836, -0.005935847759246826, -0.005747437477111816, -0.005559027194976807, -0.005370616912841797, -0.005182206630706787, -0.004993796348571777, -0.004805386066436768, -0.004616975784301758, -0.004428565502166748, -0.004240155220031738, -0.0040517449378967285, -0.0038633346557617188, -0.003674924373626709, -0.0034865140914916992, -0.0032981038093566895, -0.0031096935272216797, -0.00292128324508667, -0.00273287296295166, -0.0025444626808166504, -0.0023560523986816406, -0.002167642116546631, -0.001979231834411621, -0.0017908215522766113, -0.0016024112701416016, -0.0014140009880065918, -0.001225590705871582, -0.0010371804237365723, -0.0008487701416015625, -0.0006603598594665527, -0.00047194957733154297, -0.0002835392951965332, -9.512901306152344e-05, 9.328126907348633e-05, 0.0002816915512084961, 0.00047010183334350586, 0.0006585121154785156, 0.0008469223976135254, 0.0010353326797485352, 0.001223742961883545, 0.0014121532440185547, 0.0016005635261535645, 0.0017889738082885742, 0.001977384090423584, 0.0021657943725585938, 0.0023542046546936035, 0.0025426149368286133, 0.002731025218963623, 0.002919435501098633, 0.0031078457832336426, 0.0032962560653686523, 0.003484666347503662, 0.003673076629638672, 0.0038614869117736816, 0.004049897193908691, 0.004238307476043701, 0.004426717758178711, 0.004615128040313721, 0.0048035383224487305, 0.00499194860458374, 0.00518035888671875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 6.0, 10.0, 16.0, 12.0, 27.0, 42.0, 70.0, 95.0, 122.0, 130.0, 143.0, 108.0, 67.0, 53.0, 43.0, 24.0, 12.0, 7.0, 6.0, 4.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10547107458114624, -0.10155969858169556, -0.09764831513166428, -0.09373693913221359, -0.08982555568218231, -0.08591417968273163, -0.08200280368328094, -0.07809142768383026, -0.07418004423379898, -0.0702686682343483, -0.06635728478431702, -0.06244590878486633, -0.05853452906012535, -0.05462314933538437, -0.050711773335933685, -0.0468003936111927, -0.04288901388645172, -0.03897763416171074, -0.03506625443696976, -0.031154878437519073, -0.02724349871277809, -0.02333211898803711, -0.019420741125941277, -0.015509363263845444, -0.011597983539104462, -0.007686604745686054, -0.003775225952267647, 0.00013615284115076065, 0.004047531634569168, 0.00795891135931015, 0.011870289221405983, 0.015781667083501816, 0.019693046808242798, 0.02360442653298378, 0.027515804395079613, 0.031427182257175446, 0.03533856198191643, 0.03924994170665741, 0.04316131770610809, 0.047072697430849075, 0.05098407715559006, 0.05489545688033104, 0.05880683660507202, 0.0627182126045227, 0.06662958860397339, 0.07054097205400467, 0.07445234805345535, 0.07836373150348663, 0.08227510750293732, 0.086186483502388, 0.09009786695241928, 0.09400924295186996, 0.09792062640190125, 0.10183200240135193, 0.10574337840080261, 0.1096547544002533, 0.11356613785028458, 0.11747751384973526, 0.12138889729976654, 0.12530027329921722, 0.1292116492986679, 0.13312304019927979, 0.13703441619873047, 0.14094579219818115, 0.14485716819763184]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 1.0, 8.0, 6.0, 3.0, 5.0, 14.0, 11.0, 23.0, 17.0, 19.0, 15.0, 13.0, 24.0, 27.0, 32.0, 37.0, 44.0, 47.0, 39.0, 44.0, 54.0, 48.0, 60.0, 39.0, 52.0, 47.0, 26.0, 36.0, 38.0, 33.0, 24.0, 26.0, 18.0, 11.0, 9.0, 9.0, 7.0, 7.0, 6.0, 9.0, 3.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.06374287605285645, -0.061899974942207336, -0.06005707383155823, -0.05821417644619942, -0.05637127533555031, -0.0545283742249012, -0.05268547683954239, -0.05084257572889328, -0.04899967461824417, -0.04715677350759506, -0.04531387239694595, -0.04347097501158714, -0.041628073900938034, -0.039785172790288925, -0.037942275404930115, -0.036099374294281006, -0.0342564731836319, -0.03241357207298279, -0.03057067282497883, -0.02872777357697487, -0.02688487246632576, -0.02504197135567665, -0.02319907210767269, -0.02135617285966873, -0.019513271749019623, -0.017670370638370514, -0.015827471390366554, -0.01398457121104002, -0.012141671031713486, -0.010298770852386951, -0.008455870673060417, -0.006612970493733883, -0.004770070314407349, -0.0029271701350808144, -0.00108426995575428, 0.0007586302235722542, 0.0026015304028987885, 0.004444430582225323, 0.006287330761551857, 0.008130230940878391, 0.009973131120204926, 0.01181603129953146, 0.013658931478857994, 0.015501831658184528, 0.017344731837511063, 0.01918763294816017, 0.02103053219616413, 0.02287343144416809, 0.0247163325548172, 0.02655923366546631, 0.028402132913470268, 0.030245032161474228, 0.03208793327212334, 0.033930834382772446, 0.035773731768131256, 0.037616632878780365, 0.039459533989429474, 0.04130243510007858, 0.04314533621072769, 0.0449882335960865, 0.04683113470673561, 0.04867403581738472, 0.05051693320274353, 0.05235983431339264, 0.05420273542404175]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 8.0, 11.0, 4.0, 5.0, 7.0, 18.0, 14.0, 23.0, 32.0, 41.0, 50.0, 71.0, 95.0, 125.0, 203.0, 323.0, 563.0, 969.0, 2101.0, 5141.0, 15510.0, 62277.0, 381236.0, 2625715.0, 942184.0, 116262.0, 26745.0, 8363.0, 3167.0, 1344.0, 689.0, 371.0, 219.0, 133.0, 77.0, 49.0, 45.0, 29.0, 17.0, 22.0, 9.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.032073974609375, -0.031223058700561523, -0.030372142791748047, -0.02952122688293457, -0.028670310974121094, -0.027819395065307617, -0.02696847915649414, -0.026117563247680664, -0.025266647338867188, -0.02441573143005371, -0.023564815521240234, -0.022713899612426758, -0.02186298370361328, -0.021012067794799805, -0.020161151885986328, -0.01931023597717285, -0.018459320068359375, -0.0176084041595459, -0.016757488250732422, -0.015906572341918945, -0.015055656433105469, -0.014204740524291992, -0.013353824615478516, -0.012502908706665039, -0.011651992797851562, -0.010801076889038086, -0.00995016098022461, -0.009099245071411133, -0.008248329162597656, -0.00739741325378418, -0.006546497344970703, -0.0056955814361572266, -0.00484466552734375, -0.0039937496185302734, -0.003142833709716797, -0.0022919178009033203, -0.0014410018920898438, -0.0005900859832763672, 0.0002608299255371094, 0.001111745834350586, 0.0019626617431640625, 0.002813577651977539, 0.0036644935607910156, 0.004515409469604492, 0.005366325378417969, 0.006217241287231445, 0.007068157196044922, 0.007919073104858398, 0.008769989013671875, 0.009620904922485352, 0.010471820831298828, 0.011322736740112305, 0.012173652648925781, 0.013024568557739258, 0.013875484466552734, 0.014726400375366211, 0.015577316284179688, 0.016428232192993164, 0.01727914810180664, 0.018130064010620117, 0.018980979919433594, 0.01983189582824707, 0.020682811737060547, 0.021533727645874023, 0.0223846435546875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 8.0, 23.0, 27.0, 23.0, 66.0, 85.0, 109.0, 152.0, 123.0, 121.0, 94.0, 80.0, 55.0, 18.0, 11.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0233612060546875, -0.022793292999267578, -0.022225379943847656, -0.021657466888427734, -0.021089553833007812, -0.02052164077758789, -0.01995372772216797, -0.019385814666748047, -0.018817901611328125, -0.018249988555908203, -0.01768207550048828, -0.01711416244506836, -0.016546249389648438, -0.015978336334228516, -0.015410423278808594, -0.014842510223388672, -0.01427459716796875, -0.013706684112548828, -0.013138771057128906, -0.012570858001708984, -0.012002944946289062, -0.01143503189086914, -0.010867118835449219, -0.010299205780029297, -0.009731292724609375, -0.009163379669189453, -0.008595466613769531, -0.00802755355834961, -0.0074596405029296875, -0.006891727447509766, -0.006323814392089844, -0.005755901336669922, -0.00518798828125, -0.004620075225830078, -0.004052162170410156, -0.0034842491149902344, -0.0029163360595703125, -0.0023484230041503906, -0.0017805099487304688, -0.0012125968933105469, -0.000644683837890625, -7.677078247070312e-05, 0.0004911422729492188, 0.0010590553283691406, 0.0016269683837890625, 0.0021948814392089844, 0.0027627944946289062, 0.003330707550048828, 0.00389862060546875, 0.004466533660888672, 0.005034446716308594, 0.005602359771728516, 0.0061702728271484375, 0.006738185882568359, 0.007306098937988281, 0.007874011993408203, 0.008441925048828125, 0.009009838104248047, 0.009577751159667969, 0.01014566421508789, 0.010713577270507812, 0.011281490325927734, 0.011849403381347656, 0.012417316436767578, 0.0129852294921875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 6.0, 4.0, 17.0, 16.0, 19.0, 28.0, 34.0, 56.0, 75.0, 96.0, 135.0, 173.0, 310.0, 469.0, 816.0, 1474.0, 2603.0, 5283.0, 12221.0, 32176.0, 114239.0, 665271.0, 2735319.0, 484312.0, 91185.0, 27294.0, 10353.0, 4582.0, 2354.0, 1277.0, 763.0, 426.0, 291.0, 169.0, 130.0, 102.0, 62.0, 39.0, 37.0, 16.0, 12.0, 13.0, 12.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.020751953125, -0.02006983757019043, -0.01938772201538086, -0.01870560646057129, -0.01802349090576172, -0.01734137535095215, -0.016659259796142578, -0.015977144241333008, -0.015295028686523438, -0.014612913131713867, -0.013930797576904297, -0.013248682022094727, -0.012566566467285156, -0.011884450912475586, -0.011202335357666016, -0.010520219802856445, -0.009838104248046875, -0.009155988693237305, -0.008473873138427734, -0.007791757583618164, -0.007109642028808594, -0.0064275264739990234, -0.005745410919189453, -0.005063295364379883, -0.0043811798095703125, -0.003699064254760742, -0.003016948699951172, -0.0023348331451416016, -0.0016527175903320312, -0.0009706020355224609, -0.0002884864807128906, 0.0003936290740966797, 0.00107574462890625, 0.0017578601837158203, 0.0024399757385253906, 0.003122091293334961, 0.0038042068481445312, 0.0044863224029541016, 0.005168437957763672, 0.005850553512573242, 0.0065326690673828125, 0.007214784622192383, 0.007896900177001953, 0.008579015731811523, 0.009261131286621094, 0.009943246841430664, 0.010625362396240234, 0.011307477951049805, 0.011989593505859375, 0.012671709060668945, 0.013353824615478516, 0.014035940170288086, 0.014718055725097656, 0.015400171279907227, 0.016082286834716797, 0.016764402389526367, 0.017446517944335938, 0.018128633499145508, 0.018810749053955078, 0.01949286460876465, 0.02017498016357422, 0.02085709571838379, 0.02153921127319336, 0.02222132682800293, 0.0229034423828125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 1.0, 2.0, 8.0, 14.0, 6.0, 13.0, 22.0, 24.0, 32.0, 37.0, 57.0, 74.0, 116.0, 209.0, 328.0, 490.0, 622.0, 547.0, 437.0, 330.0, 222.0, 131.0, 97.0, 57.0, 48.0, 34.0, 31.0, 15.0, 16.0, 16.0, 7.0, 2.0, 7.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.03570556640625, -0.03473210334777832, -0.03375864028930664, -0.03278517723083496, -0.03181171417236328, -0.0308382511138916, -0.029864788055419922, -0.028891324996948242, -0.027917861938476562, -0.026944398880004883, -0.025970935821533203, -0.024997472763061523, -0.024024009704589844, -0.023050546646118164, -0.022077083587646484, -0.021103620529174805, -0.020130157470703125, -0.019156694412231445, -0.018183231353759766, -0.017209768295288086, -0.016236305236816406, -0.015262842178344727, -0.014289379119873047, -0.013315916061401367, -0.012342453002929688, -0.011368989944458008, -0.010395526885986328, -0.009422063827514648, -0.008448600769042969, -0.007475137710571289, -0.006501674652099609, -0.00552821159362793, -0.00455474853515625, -0.0035812854766845703, -0.0026078224182128906, -0.001634359359741211, -0.0006608963012695312, 0.00031256675720214844, 0.0012860298156738281, 0.002259492874145508, 0.0032329559326171875, 0.004206418991088867, 0.005179882049560547, 0.0061533451080322266, 0.007126808166503906, 0.008100271224975586, 0.009073734283447266, 0.010047197341918945, 0.011020660400390625, 0.011994123458862305, 0.012967586517333984, 0.013941049575805664, 0.014914512634277344, 0.015887975692749023, 0.016861438751220703, 0.017834901809692383, 0.018808364868164062, 0.019781827926635742, 0.020755290985107422, 0.0217287540435791, 0.02270221710205078, 0.02367568016052246, 0.02464914321899414, 0.02562260627746582, 0.0265960693359375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 7.0, 4.0, 6.0, 5.0, 12.0, 26.0, 58.0, 72.0, 144.0, 196.0, 157.0, 125.0, 65.0, 42.0, 27.0, 20.0, 7.0, 14.0, 5.0, 3.0, 3.0, 10.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7125900983810425, -0.6940808892250061, -0.675571620464325, -0.6570624113082886, -0.6385531425476074, -0.620043933391571, -0.6015347242355347, -0.5830254554748535, -0.5645162463188171, -0.5460070371627808, -0.5274977684020996, -0.5089885592460632, -0.49047932028770447, -0.4719700813293457, -0.4534608721733093, -0.43495163321495056, -0.4164423942565918, -0.39793315529823303, -0.37942391633987427, -0.3609147071838379, -0.3424054682254791, -0.32389622926712036, -0.305387020111084, -0.2868777811527252, -0.26836854219436646, -0.2498593032360077, -0.23135007917881012, -0.21284085512161255, -0.19433161616325378, -0.17582237720489502, -0.15731315314769745, -0.13880392909049988, -0.1202947199344635, -0.10178548842668533, -0.08327625691890717, -0.064767025411129, -0.04625779390335083, -0.027748562395572662, -0.009239330887794495, 0.009269893169403076, 0.02777913212776184, 0.04628836363554001, 0.06479759514331818, 0.08330682665109634, 0.10181605815887451, 0.12032528966665268, 0.13883452117443085, 0.15734374523162842, 0.17585298418998718, 0.19436222314834595, 0.21287144720554352, 0.2313806712627411, 0.24988991022109985, 0.2683991491794586, 0.2869083881378174, 0.30541759729385376, 0.3239268362522125, 0.3424360752105713, 0.36094528436660767, 0.37945452332496643, 0.3979637622833252, 0.41647300124168396, 0.4349822402000427, 0.4534914493560791, 0.47200068831443787]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 4.0, 7.0, 8.0, 16.0, 23.0, 16.0, 30.0, 47.0, 57.0, 58.0, 74.0, 75.0, 83.0, 91.0, 71.0, 72.0, 69.0, 45.0, 34.0, 37.0, 33.0, 19.0, 8.0, 11.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34489548206329346, -0.3330124318599701, -0.32112938165664673, -0.30924636125564575, -0.2973633110523224, -0.285480260848999, -0.27359724044799805, -0.2617141902446747, -0.24983114004135132, -0.23794808983802795, -0.22606505453586578, -0.2141820192337036, -0.20229896903038025, -0.19041591882705688, -0.17853288352489471, -0.16664984822273254, -0.15476679801940918, -0.14288374781608582, -0.13100071251392365, -0.11911766976118088, -0.10723462700843811, -0.09535158425569534, -0.08346854150295258, -0.07158549875020981, -0.05970245599746704, -0.047819413244724274, -0.035936370491981506, -0.02405332773923874, -0.012170284986495972, -0.00028724223375320435, 0.011595800518989563, 0.02347884327173233, 0.0353618860244751, 0.047244928777217865, 0.05912797152996063, 0.0710110142827034, 0.08289405703544617, 0.09477709978818893, 0.1066601425409317, 0.11854318529367447, 0.13042622804641724, 0.1423092782497406, 0.15419231355190277, 0.16607534885406494, 0.1779583990573883, 0.18984144926071167, 0.20172448456287384, 0.213607519865036, 0.22549057006835938, 0.23737362027168274, 0.2492566555738449, 0.2611396908760071, 0.27302274107933044, 0.2849057912826538, 0.2967888116836548, 0.30867186188697815, 0.3205549120903015, 0.3324379622936249, 0.34432101249694824, 0.3562040328979492, 0.3680870831012726, 0.37997013330459595, 0.3918531537055969, 0.4037362039089203, 0.41561925411224365]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 9.0, 4.0, 7.0, 17.0, 31.0, 22.0, 44.0, 60.0, 83.0, 130.0, 181.0, 270.0, 400.0, 638.0, 1003.0, 1625.0, 2664.0, 4816.0, 8987.0, 18634.0, 42917.0, 113525.0, 311011.0, 329524.0, 123619.0, 46256.0, 20047.0, 9623.0, 4982.0, 2797.0, 1658.0, 1052.0, 633.0, 402.0, 264.0, 192.0, 124.0, 79.0, 64.0, 45.0, 32.0, 28.0, 15.0, 15.0, 7.0, 5.0, 6.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.021697998046875, -0.02099895477294922, -0.020299911499023438, -0.019600868225097656, -0.018901824951171875, -0.018202781677246094, -0.017503738403320312, -0.01680469512939453, -0.01610565185546875, -0.015406608581542969, -0.014707565307617188, -0.014008522033691406, -0.013309478759765625, -0.012610435485839844, -0.011911392211914062, -0.011212348937988281, -0.0105133056640625, -0.009814262390136719, -0.009115219116210938, -0.008416175842285156, -0.007717132568359375, -0.007018089294433594, -0.0063190460205078125, -0.005620002746582031, -0.00492095947265625, -0.004221916198730469, -0.0035228729248046875, -0.0028238296508789062, -0.002124786376953125, -0.0014257431030273438, -0.0007266998291015625, -2.765655517578125e-05, 0.00067138671875, 0.0013704299926757812, 0.0020694732666015625, 0.0027685165405273438, 0.003467559814453125, 0.004166603088378906, 0.0048656463623046875, 0.005564689636230469, 0.00626373291015625, 0.006962776184082031, 0.0076618194580078125, 0.008360862731933594, 0.009059906005859375, 0.009758949279785156, 0.010457992553710938, 0.011157035827636719, 0.0118560791015625, 0.012555122375488281, 0.013254165649414062, 0.013953208923339844, 0.014652252197265625, 0.015351295471191406, 0.016050338745117188, 0.01674938201904297, 0.01744842529296875, 0.01814746856689453, 0.018846511840820312, 0.019545555114746094, 0.020244598388671875, 0.020943641662597656, 0.021642684936523438, 0.02234172821044922, 0.023040771484375]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 7.0, 10.0, 12.0, 13.0, 32.0, 50.0, 60.0, 70.0, 80.0, 83.0, 114.0, 117.0, 102.0, 76.0, 54.0, 36.0, 24.0, 10.0, 12.0, 13.0, 7.0, 5.0, 9.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.032379150390625, -0.03138160705566406, -0.030384063720703125, -0.029386520385742188, -0.02838897705078125, -0.027391433715820312, -0.026393890380859375, -0.025396347045898438, -0.0243988037109375, -0.023401260375976562, -0.022403717041015625, -0.021406173706054688, -0.02040863037109375, -0.019411087036132812, -0.018413543701171875, -0.017416000366210938, -0.01641845703125, -0.015420913696289062, -0.014423370361328125, -0.013425827026367188, -0.01242828369140625, -0.011430740356445312, -0.010433197021484375, -0.009435653686523438, -0.0084381103515625, -0.0074405670166015625, -0.006443023681640625, -0.0054454803466796875, -0.00444793701171875, -0.0034503936767578125, -0.002452850341796875, -0.0014553070068359375, -0.000457763671875, 0.0005397796630859375, 0.001537322998046875, 0.0025348663330078125, 0.00353240966796875, 0.0045299530029296875, 0.005527496337890625, 0.0065250396728515625, 0.0075225830078125, 0.008520126342773438, 0.009517669677734375, 0.010515213012695312, 0.01151275634765625, 0.012510299682617188, 0.013507843017578125, 0.014505386352539062, 0.0155029296875, 0.016500473022460938, 0.017498016357421875, 0.018495559692382812, 0.01949310302734375, 0.020490646362304688, 0.021488189697265625, 0.022485733032226562, 0.0234832763671875, 0.024480819702148438, 0.025478363037109375, 0.026475906372070312, 0.02747344970703125, 0.028470993041992188, 0.029468536376953125, 0.030466079711914062, 0.031463623046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 6.0, 4.0, 6.0, 8.0, 17.0, 12.0, 23.0, 37.0, 35.0, 83.0, 125.0, 192.0, 390.0, 719.0, 1413.0, 3301.0, 8167.0, 25441.0, 115436.0, 727668.0, 124289.0, 26205.0, 8297.0, 3310.0, 1513.0, 781.0, 432.0, 235.0, 156.0, 98.0, 46.0, 39.0, 20.0, 12.0, 7.0, 8.0, 7.0, 8.0, 2.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0660400390625, -0.06406974792480469, -0.062099456787109375, -0.06012916564941406, -0.05815887451171875, -0.05618858337402344, -0.054218292236328125, -0.05224800109863281, -0.0502777099609375, -0.04830741882324219, -0.046337127685546875, -0.04436683654785156, -0.04239654541015625, -0.04042625427246094, -0.038455963134765625, -0.03648567199707031, -0.034515380859375, -0.03254508972167969, -0.030574798583984375, -0.028604507446289062, -0.02663421630859375, -0.024663925170898438, -0.022693634033203125, -0.020723342895507812, -0.0187530517578125, -0.016782760620117188, -0.014812469482421875, -0.012842178344726562, -0.01087188720703125, -0.008901596069335938, -0.006931304931640625, -0.0049610137939453125, -0.00299072265625, -0.0010204315185546875, 0.000949859619140625, 0.0029201507568359375, 0.00489044189453125, 0.0068607330322265625, 0.008831024169921875, 0.010801315307617188, 0.0127716064453125, 0.014741897583007812, 0.016712188720703125, 0.018682479858398438, 0.02065277099609375, 0.022623062133789062, 0.024593353271484375, 0.026563644409179688, 0.028533935546875, 0.030504226684570312, 0.032474517822265625, 0.03444480895996094, 0.03641510009765625, 0.03838539123535156, 0.040355682373046875, 0.04232597351074219, 0.0442962646484375, 0.04626655578613281, 0.048236846923828125, 0.05020713806152344, 0.05217742919921875, 0.05414772033691406, 0.056118011474609375, 0.05808830261230469, 0.06005859375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 8.0, 13.0, 13.0, 15.0, 22.0, 29.0, 30.0, 29.0, 46.0, 46.0, 45.0, 60.0, 71.0, 67.0, 63.0, 64.0, 59.0, 54.0, 41.0, 36.0, 31.0, 36.0, 17.0, 22.0, 14.0, 7.0, 9.0, 16.0, 7.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10296630859375, -0.0996084213256836, -0.09625053405761719, -0.09289264678955078, -0.08953475952148438, -0.08617687225341797, -0.08281898498535156, -0.07946109771728516, -0.07610321044921875, -0.07274532318115234, -0.06938743591308594, -0.06602954864501953, -0.06267166137695312, -0.05931377410888672, -0.05595588684082031, -0.052597999572753906, -0.0492401123046875, -0.045882225036621094, -0.04252433776855469, -0.03916645050048828, -0.035808563232421875, -0.03245067596435547, -0.029092788696289062, -0.025734901428222656, -0.02237701416015625, -0.019019126892089844, -0.015661239624023438, -0.012303352355957031, -0.008945465087890625, -0.005587577819824219, -0.0022296905517578125, 0.0011281967163085938, 0.004486083984375, 0.007843971252441406, 0.011201858520507812, 0.014559745788574219, 0.017917633056640625, 0.02127552032470703, 0.024633407592773438, 0.027991294860839844, 0.03134918212890625, 0.034707069396972656, 0.03806495666503906, 0.04142284393310547, 0.044780731201171875, 0.04813861846923828, 0.05149650573730469, 0.054854393005371094, 0.0582122802734375, 0.061570167541503906, 0.06492805480957031, 0.06828594207763672, 0.07164382934570312, 0.07500171661376953, 0.07835960388183594, 0.08171749114990234, 0.08507537841796875, 0.08843326568603516, 0.09179115295410156, 0.09514904022216797, 0.09850692749023438, 0.10186481475830078, 0.10522270202636719, 0.1085805892944336, 0.1119384765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 2.0, 3.0, 4.0, 8.0, 6.0, 8.0, 16.0, 11.0, 17.0, 31.0, 52.0, 102.0, 173.0, 479.0, 1322.0, 5006.0, 43760.0, 918445.0, 69897.0, 6710.0, 1501.0, 522.0, 200.0, 109.0, 42.0, 27.0, 20.0, 20.0, 12.0, 10.0, 7.0, 2.0, 6.0, 5.0, 6.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.049346923828125, -0.04755735397338867, -0.045767784118652344, -0.043978214263916016, -0.04218864440917969, -0.04039907455444336, -0.03860950469970703, -0.0368199348449707, -0.035030364990234375, -0.03324079513549805, -0.03145122528076172, -0.02966165542602539, -0.027872085571289062, -0.026082515716552734, -0.024292945861816406, -0.022503376007080078, -0.02071380615234375, -0.018924236297607422, -0.017134666442871094, -0.015345096588134766, -0.013555526733398438, -0.01176595687866211, -0.009976387023925781, -0.008186817169189453, -0.006397247314453125, -0.004607677459716797, -0.0028181076049804688, -0.0010285377502441406, 0.0007610321044921875, 0.0025506019592285156, 0.004340171813964844, 0.006129741668701172, 0.0079193115234375, 0.009708881378173828, 0.011498451232910156, 0.013288021087646484, 0.015077590942382812, 0.01686716079711914, 0.01865673065185547, 0.020446300506591797, 0.022235870361328125, 0.024025440216064453, 0.02581501007080078, 0.02760457992553711, 0.029394149780273438, 0.031183719635009766, 0.032973289489746094, 0.03476285934448242, 0.03655242919921875, 0.03834199905395508, 0.040131568908691406, 0.041921138763427734, 0.04371070861816406, 0.04550027847290039, 0.04728984832763672, 0.04907941818237305, 0.050868988037109375, 0.0526585578918457, 0.05444812774658203, 0.05623769760131836, 0.05802726745605469, 0.059816837310791016, 0.061606407165527344, 0.06339597702026367, 0.065185546875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 2.0, 5.0, 6.0, 6.0, 9.0, 5.0, 12.0, 9.0, 16.0, 9.0, 15.0, 20.0, 18.0, 24.0, 25.0, 38.0, 45.0, 46.0, 81.0, 80.0, 108.0, 86.0, 53.0, 41.0, 41.0, 35.0, 28.0, 21.0, 19.0, 10.0, 17.0, 12.0, 10.0, 2.0, 6.0, 6.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 0.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.427267074584961e-05, -3.3200718462467194e-05, -3.212876617908478e-05, -3.105681389570236e-05, -2.9984861612319946e-05, -2.891290932893753e-05, -2.7840957045555115e-05, -2.67690047621727e-05, -2.5697052478790283e-05, -2.4625100195407867e-05, -2.355314791202545e-05, -2.2481195628643036e-05, -2.140924334526062e-05, -2.0337291061878204e-05, -1.926533877849579e-05, -1.8193386495113373e-05, -1.7121434211730957e-05, -1.604948192834854e-05, -1.4977529644966125e-05, -1.390557736158371e-05, -1.2833625078201294e-05, -1.1761672794818878e-05, -1.0689720511436462e-05, -9.617768228054047e-06, -8.545815944671631e-06, -7.473863661289215e-06, -6.401911377906799e-06, -5.3299590945243835e-06, -4.258006811141968e-06, -3.186054527759552e-06, -2.1141022443771362e-06, -1.0421499609947205e-06, 2.9802322387695312e-08, 1.101754605770111e-06, 2.173706889152527e-06, 3.2456591725349426e-06, 4.317611455917358e-06, 5.389563739299774e-06, 6.46151602268219e-06, 7.533468306064606e-06, 8.605420589447021e-06, 9.677372872829437e-06, 1.0749325156211853e-05, 1.1821277439594269e-05, 1.2893229722976685e-05, 1.39651820063591e-05, 1.5037134289741516e-05, 1.6109086573123932e-05, 1.7181038856506348e-05, 1.8252991139888763e-05, 1.932494342327118e-05, 2.0396895706653595e-05, 2.146884799003601e-05, 2.2540800273418427e-05, 2.3612752556800842e-05, 2.4684704840183258e-05, 2.5756657123565674e-05, 2.682860940694809e-05, 2.7900561690330505e-05, 2.897251397371292e-05, 3.0044466257095337e-05, 3.111641854047775e-05, 3.218837082386017e-05, 3.3260323107242584e-05, 3.4332275390625e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 6.0, 1.0, 6.0, 2.0, 13.0, 17.0, 26.0, 46.0, 56.0, 84.0, 152.0, 307.0, 691.0, 1775.0, 6424.0, 40278.0, 832831.0, 147817.0, 13082.0, 2893.0, 1065.0, 467.0, 214.0, 115.0, 66.0, 41.0, 25.0, 19.0, 18.0, 7.0, 5.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.049072265625, -0.047837018966674805, -0.04660177230834961, -0.045366525650024414, -0.04413127899169922, -0.04289603233337402, -0.04166078567504883, -0.04042553901672363, -0.03919029235839844, -0.03795504570007324, -0.03671979904174805, -0.03548455238342285, -0.034249305725097656, -0.03301405906677246, -0.031778812408447266, -0.03054356575012207, -0.029308319091796875, -0.02807307243347168, -0.026837825775146484, -0.02560257911682129, -0.024367332458496094, -0.0231320858001709, -0.021896839141845703, -0.020661592483520508, -0.019426345825195312, -0.018191099166870117, -0.016955852508544922, -0.015720605850219727, -0.014485359191894531, -0.013250112533569336, -0.01201486587524414, -0.010779619216918945, -0.00954437255859375, -0.008309125900268555, -0.007073879241943359, -0.005838632583618164, -0.004603385925292969, -0.0033681392669677734, -0.002132892608642578, -0.0008976459503173828, 0.0003376007080078125, 0.0015728473663330078, 0.002808094024658203, 0.0040433406829833984, 0.005278587341308594, 0.006513833999633789, 0.007749080657958984, 0.00898432731628418, 0.010219573974609375, 0.01145482063293457, 0.012690067291259766, 0.013925313949584961, 0.015160560607910156, 0.01639580726623535, 0.017631053924560547, 0.018866300582885742, 0.020101547241210938, 0.021336793899536133, 0.022572040557861328, 0.023807287216186523, 0.02504253387451172, 0.026277780532836914, 0.02751302719116211, 0.028748273849487305, 0.0299835205078125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 7.0, 13.0, 8.0, 7.0, 13.0, 21.0, 27.0, 25.0, 30.0, 57.0, 96.0, 82.0, 128.0, 104.0, 97.0, 68.0, 61.0, 33.0, 34.0, 25.0, 16.0, 8.0, 12.0, 8.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038604736328125, -0.03752279281616211, -0.03644084930419922, -0.03535890579223633, -0.03427696228027344, -0.03319501876831055, -0.032113075256347656, -0.031031131744384766, -0.029949188232421875, -0.028867244720458984, -0.027785301208496094, -0.026703357696533203, -0.025621414184570312, -0.024539470672607422, -0.02345752716064453, -0.02237558364868164, -0.02129364013671875, -0.02021169662475586, -0.01912975311279297, -0.018047809600830078, -0.016965866088867188, -0.015883922576904297, -0.014801979064941406, -0.013720035552978516, -0.012638092041015625, -0.011556148529052734, -0.010474205017089844, -0.009392261505126953, -0.008310317993164062, -0.007228374481201172, -0.006146430969238281, -0.005064487457275391, -0.0039825439453125, -0.0029006004333496094, -0.0018186569213867188, -0.0007367134094238281, 0.0003452301025390625, 0.0014271736145019531, 0.0025091171264648438, 0.0035910606384277344, 0.004673004150390625, 0.005754947662353516, 0.006836891174316406, 0.007918834686279297, 0.009000778198242188, 0.010082721710205078, 0.011164665222167969, 0.01224660873413086, 0.01332855224609375, 0.01441049575805664, 0.015492439270019531, 0.016574382781982422, 0.017656326293945312, 0.018738269805908203, 0.019820213317871094, 0.020902156829833984, 0.021984100341796875, 0.023066043853759766, 0.024147987365722656, 0.025229930877685547, 0.026311874389648438, 0.027393817901611328, 0.02847576141357422, 0.02955770492553711, 0.0306396484375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 2.0, 2.0, 8.0, 7.0, 6.0, 17.0, 10.0, 21.0, 32.0, 55.0, 51.0, 107.0, 122.0, 131.0, 109.0, 102.0, 56.0, 36.0, 23.0, 19.0, 22.0, 12.0, 15.0, 9.0, 5.0, 4.0, 1.0, 6.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45653796195983887, -0.44032391905784607, -0.42410987615585327, -0.4078958034515381, -0.3916817605495453, -0.3754677176475525, -0.3592536747455597, -0.3430396318435669, -0.3268255591392517, -0.3106115162372589, -0.2943974733352661, -0.2781834006309509, -0.26196935772895813, -0.24575531482696533, -0.22954127192497253, -0.21332722902297974, -0.19711318612098694, -0.18089914321899414, -0.16468508541584015, -0.14847104251384735, -0.13225698471069336, -0.11604294180870056, -0.09982889890670776, -0.08361484855413437, -0.06740079820156097, -0.05118674784898758, -0.03497270122170448, -0.018758654594421387, -0.002544604241847992, 0.013669446110725403, 0.0298834890127182, 0.046097539365291595, 0.06231158971786499, 0.07852564007043839, 0.09473969042301178, 0.11095373332500458, 0.12716779112815857, 0.14338183403015137, 0.15959587693214417, 0.17580991983413696, 0.19202397763729095, 0.20823802053928375, 0.22445207834243774, 0.24066612124443054, 0.25688016414642334, 0.2730942368507385, 0.28930824995040894, 0.3055223226547241, 0.3217363655567169, 0.3379504084587097, 0.3541644513607025, 0.3703784942626953, 0.3865925669670105, 0.4028066098690033, 0.4190206527709961, 0.4352346956729889, 0.4514487385749817, 0.4676627814769745, 0.4838768243789673, 0.5000908970832825, 0.5163049101829529, 0.5325189828872681, 0.5487329959869385, 0.5649470686912537, 0.5811611413955688]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 9.0, 8.0, 13.0, 16.0, 29.0, 28.0, 29.0, 41.0, 44.0, 61.0, 93.0, 90.0, 105.0, 85.0, 74.0, 54.0, 55.0, 54.0, 31.0, 24.0, 22.0, 13.0, 7.0, 11.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0288023948669434, -1.0037733316421509, -0.9787443280220032, -0.9537153244018555, -0.9286863207817078, -0.9036572575569153, -0.8786282539367676, -0.8535991907119751, -0.8285701870918274, -0.8035411834716797, -0.7785121202468872, -0.7534831166267395, -0.7284541130065918, -0.7034250497817993, -0.6783960461616516, -0.6533670425415039, -0.6283379793167114, -0.6033089756965637, -0.5782799124717712, -0.5532509088516235, -0.5282219052314758, -0.5031928420066833, -0.47816383838653564, -0.45313480496406555, -0.42810583114624023, -0.40307679772377014, -0.37804779410362244, -0.35301876068115234, -0.32798972725868225, -0.30296069383621216, -0.27793169021606445, -0.25290265679359436, -0.22787362337112427, -0.20284460484981537, -0.17781557142734528, -0.15278655290603638, -0.12775751948356628, -0.10272850096225739, -0.07769948244094849, -0.052670449018478394, -0.027641430497169495, -0.002612406387925148, 0.0224166177213192, 0.047445639967918396, 0.07247466593980789, 0.09750369191169739, 0.12253271043300629, 0.14756174385547638, 0.17259076237678528, 0.19761978089809418, 0.22264881432056427, 0.24767783284187317, 0.27270686626434326, 0.29773586988449097, 0.32276490330696106, 0.34779393672943115, 0.37282294034957886, 0.39785197377204895, 0.42288097739219666, 0.44791001081466675, 0.47293904423713684, 0.49796807765960693, 0.5229970812797546, 0.5480260848999023, 0.5730551481246948]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 13.0, 14.0, 30.0, 35.0, 40.0, 79.0, 444.0, 132.0, 61.0, 42.0, 28.0, 17.0, 14.0, 12.0, 10.0, 5.0, 3.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07122802734375, -0.06904792785644531, -0.06686782836914062, -0.06468772888183594, -0.06250762939453125, -0.06032752990722656, -0.058147430419921875, -0.05596733093261719, -0.0537872314453125, -0.05160713195800781, -0.049427032470703125, -0.04724693298339844, -0.04506683349609375, -0.04288673400878906, -0.040706634521484375, -0.03852653503417969, -0.036346435546875, -0.03416633605957031, -0.031986236572265625, -0.029806137084960938, -0.02762603759765625, -0.025445938110351562, -0.023265838623046875, -0.021085739135742188, -0.0189056396484375, -0.016725540161132812, -0.014545440673828125, -0.012365341186523438, -0.01018524169921875, -0.008005142211914062, -0.005825042724609375, -0.0036449432373046875, -0.00146484375, 0.0007152557373046875, 0.002895355224609375, 0.0050754547119140625, 0.00725555419921875, 0.009435653686523438, 0.011615753173828125, 0.013795852661132812, 0.0159759521484375, 0.018156051635742188, 0.020336151123046875, 0.022516250610351562, 0.02469635009765625, 0.026876449584960938, 0.029056549072265625, 0.031236648559570312, 0.033416748046875, 0.03559684753417969, 0.037776947021484375, 0.03995704650878906, 0.04213714599609375, 0.04431724548339844, 0.046497344970703125, 0.04867744445800781, 0.0508575439453125, 0.05303764343261719, 0.055217742919921875, 0.05739784240722656, 0.05957794189453125, 0.06175804138183594, 0.06393814086914062, 0.06611824035644531, 0.06829833984375]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 5.0, 8.0, 7.0, 13.0, 15.0, 23.0, 36.0, 59.0, 73.0, 156.0, 292.0, 658.0, 2409.0, 17375.0, 8340027.0, 22809.0, 3014.0, 856.0, 309.0, 187.0, 86.0, 57.0, 35.0, 16.0, 24.0, 10.0, 5.0, 5.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1359749436378479, -0.12994161248207092, -0.12390827387571335, -0.11787494271993637, -0.1118416041135788, -0.10580827295780182, -0.09977494180202484, -0.09374161064624786, -0.08770827203989029, -0.08167494088411331, -0.07564160227775574, -0.06960827112197876, -0.06357493996620178, -0.05754160135984421, -0.05150827020406723, -0.045474935322999954, -0.03944160044193268, -0.0334082655608654, -0.027374932542443275, -0.02134159952402115, -0.015308264642953873, -0.009274929761886597, -0.003241598606109619, 0.002791736274957657, 0.008825071156024933, 0.014858405105769634, 0.020891739055514336, 0.026925072073936462, 0.03295840695500374, 0.038991741836071014, 0.04502507299184799, 0.05105840787291527, 0.057091742753982544, 0.06312507390975952, 0.0691584125161171, 0.07519174367189407, 0.08122508227825165, 0.08725841343402863, 0.0932917445898056, 0.09932507574558258, 0.10535841435194016, 0.11139174550771713, 0.11742508411407471, 0.12345841526985168, 0.12949174642562866, 0.13552507758140564, 0.14155840873718262, 0.1475917547941208, 0.15362508594989777, 0.15965841710567474, 0.16569174826145172, 0.1717250943183899, 0.17775842547416687, 0.18379175662994385, 0.18982508778572083, 0.1958584189414978, 0.20189175009727478, 0.20792508125305176, 0.21395841240882874, 0.2199917435646057, 0.22602508962154388, 0.23205842077732086, 0.23809175193309784, 0.24412508308887482, 0.250158429145813]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 5.0, 2.0, 5.0, 2.0, 5.0, 4.0, 10.0, 6.0, 3.0, 6.0, 7.0, 7.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.19189268350601196, -0.18177467584609985, -0.17165666818618774, -0.16153866052627563, -0.15142063796520233, -0.14130263030529022, -0.1311846226453781, -0.1210666075348854, -0.1109485998749733, -0.10083059221506119, -0.09071257710456848, -0.08059456944465637, -0.07047656178474426, -0.060358546674251556, -0.05024053901433945, -0.04012252390384674, -0.03000451624393463, -0.019886504858732224, -0.009768495336174965, 0.0003495141863822937, 0.010467525571584702, 0.02058553695678711, 0.03070354461669922, 0.040821559727191925, 0.050939567387104034, 0.06105757877230644, 0.07117559015750885, 0.08129359781742096, 0.09141160547733307, 0.10152962058782578, 0.11164762824773788, 0.12176564335823059, 0.1318836510181427, 0.1420016586780548, 0.15211966633796692, 0.16223767399787903, 0.17235569655895233, 0.18247370421886444, 0.19259171187877655, 0.20270973443984985, 0.21282774209976196, 0.22294574975967407, 0.23306375741958618, 0.2431817650794983, 0.2532997727394104, 0.2634177803993225, 0.2735357880592346, 0.2836538255214691, 0.29377180337905884, 0.30388981103897095, 0.31400781869888306, 0.32412582635879517, 0.3342438340187073, 0.3443618416786194, 0.3544798493385315, 0.364597886800766, 0.3747158944606781, 0.3848339021205902, 0.3949519097805023, 0.40506991744041443, 0.41518792510032654, 0.42530596256256104, 0.43542397022247314, 0.44554197788238525, 0.45565998554229736]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 12.0, 10.0, 19.0, 31.0, 45.0, 72.0, 125.0, 163.0, 162.0, 127.0, 82.0, 61.0, 38.0, 26.0, 18.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.050994873046875, -0.04978203773498535, -0.0485692024230957, -0.047356367111206055, -0.046143531799316406, -0.04493069648742676, -0.04371786117553711, -0.04250502586364746, -0.04129219055175781, -0.040079355239868164, -0.038866519927978516, -0.03765368461608887, -0.03644084930419922, -0.03522801399230957, -0.03401517868041992, -0.03280234336853027, -0.031589508056640625, -0.030376672744750977, -0.029163837432861328, -0.02795100212097168, -0.02673816680908203, -0.025525331497192383, -0.024312496185302734, -0.023099660873413086, -0.021886825561523438, -0.02067399024963379, -0.01946115493774414, -0.018248319625854492, -0.017035484313964844, -0.015822649002075195, -0.014609813690185547, -0.013396978378295898, -0.01218414306640625, -0.010971307754516602, -0.009758472442626953, -0.008545637130737305, -0.007332801818847656, -0.006119966506958008, -0.004907131195068359, -0.003694295883178711, -0.0024814605712890625, -0.001268625259399414, -5.5789947509765625e-05, 0.0011570453643798828, 0.0023698806762695312, 0.0035827159881591797, 0.004795551300048828, 0.0060083866119384766, 0.007221221923828125, 0.008434057235717773, 0.009646892547607422, 0.01085972785949707, 0.012072563171386719, 0.013285398483276367, 0.014498233795166016, 0.015711069107055664, 0.016923904418945312, 0.01813673973083496, 0.01934957504272461, 0.020562410354614258, 0.021775245666503906, 0.022988080978393555, 0.024200916290283203, 0.02541375160217285, 0.0266265869140625]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 8.0, 9.0, 8.0, 14.0, 27.0, 28.0, 48.0, 65.0, 131.0, 249.0, 477.0, 1026.0, 2672.0, 8834.0, 40009.0, 297428.0, 142722.0, 21192.0, 5557.0, 1966.0, 881.0, 368.0, 193.0, 135.0, 70.0, 49.0, 26.0, 20.0, 14.0, 8.0, 5.0, 4.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.487060546875, -0.4748268127441406, -0.46259307861328125, -0.4503593444824219, -0.4381256103515625, -0.4258918762207031, -0.41365814208984375, -0.4014244079589844, -0.389190673828125, -0.3769569396972656, -0.36472320556640625, -0.3524894714355469, -0.3402557373046875, -0.3280220031738281, -0.31578826904296875, -0.3035545349121094, -0.29132080078125, -0.2790870666503906, -0.26685333251953125, -0.2546195983886719, -0.2423858642578125, -0.23015213012695312, -0.21791839599609375, -0.20568466186523438, -0.193450927734375, -0.18121719360351562, -0.16898345947265625, -0.15674972534179688, -0.1445159912109375, -0.13228225708007812, -0.12004852294921875, -0.10781478881835938, -0.0955810546875, -0.08334732055664062, -0.07111358642578125, -0.058879852294921875, -0.0466461181640625, -0.034412384033203125, -0.02217864990234375, -0.009944915771484375, 0.002288818359375, 0.014522552490234375, 0.02675628662109375, 0.038990020751953125, 0.0512237548828125, 0.06345748901367188, 0.07569122314453125, 0.08792495727539062, 0.10015869140625, 0.11239242553710938, 0.12462615966796875, 0.13685989379882812, 0.1490936279296875, 0.16132736206054688, 0.17356109619140625, 0.18579483032226562, 0.198028564453125, 0.21026229858398438, 0.22249603271484375, 0.23472976684570312, 0.2469635009765625, 0.2591972351074219, 0.27143096923828125, 0.2836647033691406, 0.2958984375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 4.0, 3.0, 5.0, 15.0, 14.0, 18.0, 21.0, 46.0, 42.0, 67.0, 98.0, 104.0, 127.0, 99.0, 88.0, 68.0, 56.0, 45.0, 36.0, 18.0, 6.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.0924072265625, -0.09011220932006836, -0.08781719207763672, -0.08552217483520508, -0.08322715759277344, -0.0809321403503418, -0.07863712310791016, -0.07634210586547852, -0.07404708862304688, -0.07175207138061523, -0.0694570541381836, -0.06716203689575195, -0.06486701965332031, -0.06257200241088867, -0.06027698516845703, -0.05798196792602539, -0.05568695068359375, -0.05339193344116211, -0.05109691619873047, -0.04880189895629883, -0.04650688171386719, -0.04421186447143555, -0.041916847229003906, -0.039621829986572266, -0.037326812744140625, -0.035031795501708984, -0.032736778259277344, -0.030441761016845703, -0.028146743774414062, -0.025851726531982422, -0.02355670928955078, -0.02126169204711914, -0.0189666748046875, -0.01667165756225586, -0.014376640319824219, -0.012081623077392578, -0.009786605834960938, -0.007491588592529297, -0.005196571350097656, -0.0029015541076660156, -0.000606536865234375, 0.0016884803771972656, 0.003983497619628906, 0.006278514862060547, 0.008573532104492188, 0.010868549346923828, 0.013163566589355469, 0.01545858383178711, 0.01775360107421875, 0.02004861831665039, 0.02234363555908203, 0.024638652801513672, 0.026933670043945312, 0.029228687286376953, 0.031523704528808594, 0.033818721771240234, 0.036113739013671875, 0.038408756256103516, 0.040703773498535156, 0.0429987907409668, 0.04529380798339844, 0.04758882522583008, 0.04988384246826172, 0.05217885971069336, 0.054473876953125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 8.0, 8.0, 12.0, 11.0, 20.0, 24.0, 21.0, 26.0, 33.0, 34.0, 41.0, 40.0, 31.0, 20.0, 26.0, 24.0, 20.0, 19.0, 12.0, 11.0, 10.0, 4.0, 9.0, 3.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.15863895416259766, -0.15479515492916107, -0.15095137059688568, -0.1471075713634491, -0.1432637870311737, -0.13941998779773712, -0.13557620346546173, -0.13173240423202515, -0.12788861989974976, -0.12404482811689377, -0.12020103633403778, -0.1163572445511818, -0.1125134527683258, -0.10866965353488922, -0.10482586175203323, -0.10098206996917725, -0.09713827073574066, -0.09329447895288467, -0.08945068717002869, -0.0856068953871727, -0.08176310360431671, -0.07791930437088013, -0.07407551258802414, -0.07023172080516815, -0.06638792902231216, -0.06254413723945618, -0.05870034545660019, -0.0548565499484539, -0.051012758165597916, -0.04716896638274193, -0.04332517087459564, -0.039481379091739655, -0.03563758730888367, -0.03179379552602768, -0.027950001880526543, -0.024106208235025406, -0.02026241645216942, -0.01641862466931343, -0.012574831023812294, -0.008731037378311157, -0.00488724559545517, -0.0010434528812766075, 0.0028003398329019547, 0.006644132547080517, 0.010487925261259079, 0.014331717044115067, 0.018175510689616203, 0.02201930433511734, 0.025863096117973328, 0.029706887900829315, 0.0335506796836853, 0.03739447519183159, 0.041238266974687576, 0.045082058757543564, 0.04892585426568985, 0.05276964604854584, 0.056613437831401825, 0.06045722961425781, 0.0643010213971138, 0.06814481317996979, 0.07198861241340637, 0.07583239674568176, 0.07967619597911835, 0.08351998776197433, 0.08736377954483032]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 6.0, 10.0, 10.0, 16.0, 13.0, 23.0, 24.0, 26.0, 26.0, 31.0, 36.0, 32.0, 27.0, 42.0, 21.0, 16.0, 19.0, 15.0, 16.0, 11.0, 9.0, 8.0, 8.0, 9.0, 4.0, 6.0, 1.0, 2.0, 6.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2629207372665405, -0.2546846270561218, -0.24644850194454193, -0.23821239173412323, -0.22997626662254333, -0.22174015641212463, -0.21350404620170593, -0.20526793599128723, -0.19703181087970734, -0.18879570066928864, -0.18055957555770874, -0.17232346534729004, -0.16408735513687134, -0.15585123002529144, -0.14761511981487274, -0.13937899470329285, -0.13114288449287415, -0.12290676683187485, -0.11467064917087555, -0.10643453896045685, -0.09819842129945755, -0.08996230363845825, -0.08172619342803955, -0.07349007576704025, -0.06525395810604095, -0.057017840445041656, -0.04878172650933266, -0.04054561257362366, -0.03230949491262436, -0.02407337725162506, -0.01583726331591606, -0.007601149380207062, 0.0006349682807922363, 0.008871084079146385, 0.017107199877500534, 0.025343315675854683, 0.03357943147420883, 0.04181554913520813, 0.05005166307091713, 0.05828777700662613, 0.06652389466762543, 0.07476001232862473, 0.08299612998962402, 0.09123224020004272, 0.09946835786104202, 0.10770447552204132, 0.11594058573246002, 0.12417670339345932, 0.13241282105445862, 0.14064893126487732, 0.14888505637645721, 0.15712116658687592, 0.1653572916984558, 0.1735934019088745, 0.1818295121192932, 0.19006562232971191, 0.1983017474412918, 0.2065378576517105, 0.2147739827632904, 0.2230100929737091, 0.2312462031841278, 0.2394823282957077, 0.2477184385061264, 0.2559545636177063, 0.264190673828125]}, "eval/loss": 4.254786491394043, "eval/bleu": 4.614693226090912e-15, "eval/runtime": 2559.2675, "eval/samples_per_second": 5.767, "eval/steps_per_second": 0.721} \ No newline at end of file +{"train/loss": 4.0396, "train/learning_rate": 0.00018623309263299647, "train/epoch": 1.39, "train/global_step": 4500, "_runtime": 42345, "_timestamp": 1651716434, "_step": 4508, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 132.0, 854.0, 28.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.91638946533203, -36.24909591674805, -35.58180618286133, -34.914512634277344, -34.24721908569336, -33.579925537109375, -32.912635803222656, -32.24534225463867, -31.57805061340332, -30.91075897216797, -30.243465423583984, -29.576173782348633, -28.90888023376465, -28.241588592529297, -27.574295043945312, -26.90700340270996, -26.23971176147461, -25.572420120239258, -24.905126571655273, -24.237834930419922, -23.570541381835938, -22.903249740600586, -22.235958099365234, -21.56866455078125, -20.901371002197266, -20.234079360961914, -19.56678581237793, -18.899494171142578, -18.232200622558594, -17.564908981323242, -16.89761734008789, -16.230323791503906, -15.563033103942871, -14.895740509033203, -14.228447914123535, -13.561155319213867, -12.893863677978516, -12.226571083068848, -11.55927848815918, -10.891986846923828, -10.224693298339844, -9.557400703430176, -8.890108108520508, -8.222816467285156, -7.555523872375488, -6.88823127746582, -6.220938682556152, -5.553646564483643, -4.886354446411133, -4.219061851501465, -3.551769733428955, -2.884477138519287, -2.2171847820281982, -1.5498924255371094, -0.8825998306274414, -0.21530771255493164, 0.45198488235473633, 1.1192772388458252, 1.7865697145462036, 2.453862190246582, 3.121154546737671, 3.7884469032287598, 4.455739498138428, 5.1230316162109375, 5.7903242111206055]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 5.0, 4.0, 4.0, 8.0, 12.0, 14.0, 22.0, 22.0, 21.0, 28.0, 36.0, 40.0, 41.0, 66.0, 46.0, 66.0, 55.0, 72.0, 52.0, 63.0, 52.0, 50.0, 39.0, 28.0, 46.0, 35.0, 22.0, 22.0, 14.0, 10.0, 9.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4424476623535156, -2.321978807449341, -2.201509952545166, -2.0810413360595703, -1.9605724811553955, -1.8401036262512207, -1.719634771347046, -1.599165916442871, -1.4786971807479858, -1.358228325843811, -1.2377595901489258, -1.117290735244751, -0.996821939945221, -0.8763531446456909, -0.7558842897415161, -0.6354154944419861, -0.514946699142456, -0.394477903842926, -0.2740090787410736, -0.1535402536392212, -0.03307145833969116, 0.08739733695983887, 0.20786619186401367, 0.3283349871635437, 0.44880378246307373, 0.5692725777626038, 0.6897413730621338, 0.8102102279663086, 0.9306790232658386, 1.0511478185653687, 1.1716166734695435, 1.2920854091644287, 1.4125542640686035, 1.5330231189727783, 1.6534918546676636, 1.7739607095718384, 1.8944294452667236, 2.0148983001708984, 2.1353671550750732, 2.255836009979248, 2.3763046264648438, 2.4967734813690186, 2.6172423362731934, 2.737710952758789, 2.858179807662964, 2.9786486625671387, 3.0991175174713135, 3.2195863723754883, 3.340055227279663, 3.460524082183838, 3.5809929370880127, 3.7014617919921875, 3.821930408477783, 3.942399263381958, 4.062868118286133, 4.1833367347717285, 4.303805828094482, 4.424274444580078, 4.544743537902832, 4.665212154388428, 4.785681247711182, 4.906149864196777, 5.026618957519531, 5.147087574005127, 5.267556190490723]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 10.0, 12.0, 13.0, 32.0, 51.0, 85.0, 135.0, 263.0, 454.0, 835.0, 1586.0, 2992.0, 6175.0, 13390.0, 30167.0, 69830.0, 196738.0, 2490394.0, 1116467.0, 156262.0, 60251.0, 25884.0, 11364.0, 5408.0, 2577.0, 1338.0, 696.0, 364.0, 209.0, 112.0, 85.0, 45.0, 21.0, 12.0, 7.0, 8.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.052734375, -1.9921722412109375, -1.931610107421875, -1.8710479736328125, -1.81048583984375, -1.7499237060546875, -1.689361572265625, -1.6287994384765625, -1.5682373046875, -1.5076751708984375, -1.447113037109375, -1.3865509033203125, -1.32598876953125, -1.2654266357421875, -1.204864501953125, -1.1443023681640625, -1.083740234375, -1.0231781005859375, -0.962615966796875, -0.9020538330078125, -0.84149169921875, -0.7809295654296875, -0.720367431640625, -0.6598052978515625, -0.5992431640625, -0.5386810302734375, -0.478118896484375, -0.4175567626953125, -0.35699462890625, -0.2964324951171875, -0.235870361328125, -0.1753082275390625, -0.11474609375, -0.0541839599609375, 0.006378173828125, 0.0669403076171875, 0.12750244140625, 0.1880645751953125, 0.248626708984375, 0.3091888427734375, 0.3697509765625, 0.4303131103515625, 0.490875244140625, 0.5514373779296875, 0.61199951171875, 0.6725616455078125, 0.733123779296875, 0.7936859130859375, 0.854248046875, 0.9148101806640625, 0.975372314453125, 1.0359344482421875, 1.09649658203125, 1.1570587158203125, 1.217620849609375, 1.2781829833984375, 1.3387451171875, 1.3993072509765625, 1.459869384765625, 1.5204315185546875, 1.58099365234375, 1.6415557861328125, 1.702117919921875, 1.7626800537109375, 1.8232421875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 2.0, 2.0, 13.0, 11.0, 15.0, 26.0, 21.0, 21.0, 32.0, 42.0, 48.0, 50.0, 71.0, 56.0, 78.0, 68.0, 57.0, 59.0, 50.0, 54.0, 47.0, 30.0, 38.0, 32.0, 16.0, 23.0, 16.0, 7.0, 5.0, 5.0, 3.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.904296875, -2.794891357421875, -2.68548583984375, -2.576080322265625, -2.4666748046875, -2.357269287109375, -2.24786376953125, -2.138458251953125, -2.029052734375, -1.919647216796875, -1.81024169921875, -1.700836181640625, -1.5914306640625, -1.482025146484375, -1.37261962890625, -1.263214111328125, -1.15380859375, -1.044403076171875, -0.93499755859375, -0.825592041015625, -0.7161865234375, -0.606781005859375, -0.49737548828125, -0.387969970703125, -0.278564453125, -0.169158935546875, -0.05975341796875, 0.049652099609375, 0.1590576171875, 0.268463134765625, 0.37786865234375, 0.487274169921875, 0.5966796875, 0.706085205078125, 0.81549072265625, 0.924896240234375, 1.0343017578125, 1.143707275390625, 1.25311279296875, 1.362518310546875, 1.471923828125, 1.581329345703125, 1.69073486328125, 1.800140380859375, 1.9095458984375, 2.018951416015625, 2.12835693359375, 2.237762451171875, 2.34716796875, 2.456573486328125, 2.56597900390625, 2.675384521484375, 2.7847900390625, 2.894195556640625, 3.00360107421875, 3.113006591796875, 3.222412109375, 3.331817626953125, 3.44122314453125, 3.550628662109375, 3.6600341796875, 3.769439697265625, 3.87884521484375, 3.988250732421875, 4.09765625]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 3.0, 4.0, 10.0, 10.0, 16.0, 25.0, 35.0, 53.0, 83.0, 207.0, 4789.0, 4188374.0, 355.0, 110.0, 58.0, 45.0, 34.0, 13.0, 22.0, 6.0, 6.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-80.4375, -78.0126953125, -75.587890625, -73.1630859375, -70.73828125, -68.3134765625, -65.888671875, -63.4638671875, -61.0390625, -58.6142578125, -56.189453125, -53.7646484375, -51.33984375, -48.9150390625, -46.490234375, -44.0654296875, -41.640625, -39.2158203125, -36.791015625, -34.3662109375, -31.94140625, -29.5166015625, -27.091796875, -24.6669921875, -22.2421875, -19.8173828125, -17.392578125, -14.9677734375, -12.54296875, -10.1181640625, -7.693359375, -5.2685546875, -2.84375, -0.4189453125, 2.005859375, 4.4306640625, 6.85546875, 9.2802734375, 11.705078125, 14.1298828125, 16.5546875, 18.9794921875, 21.404296875, 23.8291015625, 26.25390625, 28.6787109375, 31.103515625, 33.5283203125, 35.953125, 38.3779296875, 40.802734375, 43.2275390625, 45.65234375, 48.0771484375, 50.501953125, 52.9267578125, 55.3515625, 57.7763671875, 60.201171875, 62.6259765625, 65.05078125, 67.4755859375, 69.900390625, 72.3251953125, 74.75]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 9.0, 8.0, 16.0, 17.0, 27.0, 33.0, 53.0, 87.0, 171.0, 855.0, 2177.0, 276.0, 116.0, 54.0, 46.0, 31.0, 25.0, 17.0, 8.0, 14.0, 6.0, 6.0, 3.0, 7.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.427734375, -1.38470458984375, -1.3416748046875, -1.29864501953125, -1.255615234375, -1.21258544921875, -1.1695556640625, -1.12652587890625, -1.08349609375, -1.04046630859375, -0.9974365234375, -0.95440673828125, -0.911376953125, -0.86834716796875, -0.8253173828125, -0.78228759765625, -0.7392578125, -0.69622802734375, -0.6531982421875, -0.61016845703125, -0.567138671875, -0.52410888671875, -0.4810791015625, -0.43804931640625, -0.39501953125, -0.35198974609375, -0.3089599609375, -0.26593017578125, -0.222900390625, -0.17987060546875, -0.1368408203125, -0.09381103515625, -0.05078125, -0.00775146484375, 0.0352783203125, 0.07830810546875, 0.121337890625, 0.16436767578125, 0.2073974609375, 0.25042724609375, 0.29345703125, 0.33648681640625, 0.3795166015625, 0.42254638671875, 0.465576171875, 0.50860595703125, 0.5516357421875, 0.59466552734375, 0.6376953125, 0.68072509765625, 0.7237548828125, 0.76678466796875, 0.809814453125, 0.85284423828125, 0.8958740234375, 0.93890380859375, 0.98193359375, 1.02496337890625, 1.0679931640625, 1.11102294921875, 1.154052734375, 1.19708251953125, 1.2401123046875, 1.28314208984375, 1.326171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 7.0, 8.0, 7.0, 9.0, 16.0, 22.0, 42.0, 78.0, 77.0, 98.0, 115.0, 139.0, 104.0, 87.0, 58.0, 43.0, 32.0, 24.0, 14.0, 10.0, 7.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0522964000701904, -2.92010498046875, -2.7879137992858887, -2.6557223796844482, -2.523530960083008, -2.3913397789001465, -2.259148359298706, -2.1269569396972656, -1.9947656393051147, -1.8625743389129639, -1.7303829193115234, -1.5981916189193726, -1.4660003185272217, -1.3338088989257812, -1.2016175985336304, -1.0694262981414795, -0.9372348785400391, -0.8050435185432434, -0.6728521585464478, -0.5406608581542969, -0.4084694981575012, -0.27627813816070557, -0.1440868377685547, -0.011895477771759033, 0.12029588222503662, 0.2524872422218323, 0.38467857241630554, 0.5168699026107788, 0.6490612626075745, 0.7812526226043701, 0.913443922996521, 1.0456352233886719, 1.1778268814086914, 1.3100181818008423, 1.4422096014022827, 1.5744009017944336, 1.706592321395874, 1.838783621788025, 1.9709749221801758, 2.103166341781616, 2.2353577613830566, 2.367549180984497, 2.4997403621673584, 2.631931781768799, 2.7641232013702393, 2.8963146209716797, 3.028505802154541, 3.1606972217559814, 3.2928884029388428, 3.425079822540283, 3.5572710037231445, 3.689462423324585, 3.8216538429260254, 3.9538450241088867, 4.086036682128906, 4.218227863311768, 4.350419044494629, 4.48261022567749, 4.61480188369751, 4.746993064880371, 4.879184246063232, 5.011375904083252, 5.143567085266113, 5.275758266448975, 5.407949924468994]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 4.0, 7.0, 4.0, 5.0, 6.0, 12.0, 14.0, 22.0, 15.0, 43.0, 29.0, 26.0, 29.0, 47.0, 50.0, 43.0, 45.0, 53.0, 34.0, 47.0, 58.0, 36.0, 46.0, 44.0, 38.0, 36.0, 38.0, 36.0, 36.0, 19.0, 22.0, 18.0, 14.0, 10.0, 3.0, 8.0, 5.0, 0.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.438009262084961, -2.351890802383423, -2.2657723426818848, -2.1796538829803467, -2.0935354232788086, -2.0074169635772705, -1.921298623085022, -1.8351801633834839, -1.7490617036819458, -1.6629432439804077, -1.5768247842788696, -1.490706443786621, -1.404587984085083, -1.318469524383545, -1.2323510646820068, -1.1462326049804688, -1.0601141452789307, -0.9739956855773926, -0.8878772258758545, -0.8017588257789612, -0.7156403660774231, -0.629521906375885, -0.5434035062789917, -0.4572850465774536, -0.3711665868759155, -0.28504812717437744, -0.19892969727516174, -0.11281126737594604, -0.02669280767440796, 0.05942565202713013, 0.14554405212402344, 0.23166251182556152, 0.3177812099456787, 0.4038996696472168, 0.4900180995464325, 0.5761365294456482, 0.6622549891471863, 0.7483734488487244, 0.8344918489456177, 0.9206103086471558, 1.0067287683486938, 1.092847228050232, 1.17896568775177, 1.2650840282440186, 1.3512024879455566, 1.4373209476470947, 1.5234394073486328, 1.609557867050171, 1.695676326751709, 1.781794786453247, 1.8679132461547852, 1.9540317058563232, 2.0401501655578613, 2.1262686252593994, 2.2123870849609375, 2.2985053062438965, 2.3846240043640137, 2.4707424640655518, 2.55686092376709, 2.642979383468628, 2.729097843170166, 2.815216302871704, 2.901334762573242, 2.987452983856201, 3.0735714435577393]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 13.0, 16.0, 15.0, 13.0, 19.0, 26.0, 34.0, 51.0, 87.0, 107.0, 176.0, 231.0, 350.0, 575.0, 987.0, 1727.0, 3410.0, 7745.0, 19143.0, 53209.0, 160161.0, 399956.0, 261177.0, 87290.0, 29925.0, 11608.0, 4885.0, 2328.0, 1199.0, 706.0, 425.0, 323.0, 198.0, 127.0, 81.0, 55.0, 33.0, 39.0, 24.0, 25.0, 15.0, 4.0, 6.0, 10.0, 7.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.373779296875, -0.3616142272949219, -0.34944915771484375, -0.3372840881347656, -0.3251190185546875, -0.3129539489746094, -0.30078887939453125, -0.2886238098144531, -0.276458740234375, -0.2642936706542969, -0.25212860107421875, -0.23996353149414062, -0.2277984619140625, -0.21563339233398438, -0.20346832275390625, -0.19130325317382812, -0.17913818359375, -0.16697311401367188, -0.15480804443359375, -0.14264297485351562, -0.1304779052734375, -0.11831283569335938, -0.10614776611328125, -0.09398269653320312, -0.081817626953125, -0.06965255737304688, -0.05748748779296875, -0.045322418212890625, -0.0331573486328125, -0.020992279052734375, -0.00882720947265625, 0.003337860107421875, 0.0155029296875, 0.027667999267578125, 0.03983306884765625, 0.051998138427734375, 0.0641632080078125, 0.07632827758789062, 0.08849334716796875, 0.10065841674804688, 0.112823486328125, 0.12498855590820312, 0.13715362548828125, 0.14931869506835938, 0.1614837646484375, 0.17364883422851562, 0.18581390380859375, 0.19797897338867188, 0.21014404296875, 0.22230911254882812, 0.23447418212890625, 0.24663925170898438, 0.2588043212890625, 0.2709693908691406, 0.28313446044921875, 0.2952995300292969, 0.307464599609375, 0.3196296691894531, 0.33179473876953125, 0.3439598083496094, 0.3561248779296875, 0.3682899475097656, 0.38045501708984375, 0.3926200866699219, 0.40478515625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 8.0, 4.0, 3.0, 5.0, 6.0, 9.0, 11.0, 23.0, 26.0, 28.0, 24.0, 23.0, 38.0, 49.0, 38.0, 31.0, 55.0, 49.0, 48.0, 42.0, 37.0, 35.0, 56.0, 50.0, 23.0, 39.0, 35.0, 42.0, 35.0, 23.0, 23.0, 18.0, 16.0, 10.0, 14.0, 5.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9072265625, -1.8449249267578125, -1.782623291015625, -1.7203216552734375, -1.65802001953125, -1.5957183837890625, -1.533416748046875, -1.4711151123046875, -1.4088134765625, -1.3465118408203125, -1.284210205078125, -1.2219085693359375, -1.15960693359375, -1.0973052978515625, -1.035003662109375, -0.9727020263671875, -0.910400390625, -0.8480987548828125, -0.785797119140625, -0.7234954833984375, -0.66119384765625, -0.5988922119140625, -0.536590576171875, -0.4742889404296875, -0.4119873046875, -0.3496856689453125, -0.287384033203125, -0.2250823974609375, -0.16278076171875, -0.1004791259765625, -0.038177490234375, 0.0241241455078125, 0.08642578125, 0.1487274169921875, 0.211029052734375, 0.2733306884765625, 0.33563232421875, 0.3979339599609375, 0.460235595703125, 0.5225372314453125, 0.5848388671875, 0.6471405029296875, 0.709442138671875, 0.7717437744140625, 0.83404541015625, 0.8963470458984375, 0.958648681640625, 1.0209503173828125, 1.083251953125, 1.1455535888671875, 1.207855224609375, 1.2701568603515625, 1.33245849609375, 1.3947601318359375, 1.457061767578125, 1.5193634033203125, 1.5816650390625, 1.6439666748046875, 1.706268310546875, 1.7685699462890625, 1.83087158203125, 1.8931732177734375, 1.955474853515625, 2.0177764892578125, 2.080078125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 8.0, 6.0, 4.0, 11.0, 20.0, 12.0, 27.0, 42.0, 30.0, 56.0, 70.0, 87.0, 98.0, 148.0, 154.0, 203.0, 302.0, 336.0, 415.0, 804.0, 2427.0, 26081.0, 430114.0, 547936.0, 33229.0, 2965.0, 789.0, 489.0, 348.0, 275.0, 205.0, 190.0, 162.0, 103.0, 89.0, 66.0, 77.0, 53.0, 25.0, 25.0, 18.0, 15.0, 12.0, 14.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.5419921875, -0.5255966186523438, -0.5092010498046875, -0.49280548095703125, -0.476409912109375, -0.46001434326171875, -0.4436187744140625, -0.42722320556640625, -0.41082763671875, -0.39443206787109375, -0.3780364990234375, -0.36164093017578125, -0.345245361328125, -0.32884979248046875, -0.3124542236328125, -0.29605865478515625, -0.2796630859375, -0.26326751708984375, -0.2468719482421875, -0.23047637939453125, -0.214080810546875, -0.19768524169921875, -0.1812896728515625, -0.16489410400390625, -0.14849853515625, -0.13210296630859375, -0.1157073974609375, -0.09931182861328125, -0.082916259765625, -0.06652069091796875, -0.0501251220703125, -0.03372955322265625, -0.017333984375, -0.00093841552734375, 0.0154571533203125, 0.03185272216796875, 0.048248291015625, 0.06464385986328125, 0.0810394287109375, 0.09743499755859375, 0.11383056640625, 0.13022613525390625, 0.1466217041015625, 0.16301727294921875, 0.179412841796875, 0.19580841064453125, 0.2122039794921875, 0.22859954833984375, 0.2449951171875, 0.26139068603515625, 0.2777862548828125, 0.29418182373046875, 0.310577392578125, 0.32697296142578125, 0.3433685302734375, 0.35976409912109375, 0.37615966796875, 0.39255523681640625, 0.4089508056640625, 0.42534637451171875, 0.441741943359375, 0.45813751220703125, 0.4745330810546875, 0.49092864990234375, 0.50732421875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 9.0, 11.0, 10.0, 12.0, 7.0, 12.0, 12.0, 13.0, 20.0, 22.0, 18.0, 24.0, 37.0, 45.0, 32.0, 31.0, 45.0, 57.0, 46.0, 54.0, 39.0, 47.0, 44.0, 35.0, 34.0, 36.0, 33.0, 38.0, 25.0, 33.0, 29.0, 20.0, 12.0, 15.0, 12.0, 15.0, 9.0, 4.0, 1.0, 5.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.33203125, -3.208984375, -3.0859375, -2.962890625, -2.83984375, -2.716796875, -2.59375, -2.470703125, -2.34765625, -2.224609375, -2.1015625, -1.978515625, -1.85546875, -1.732421875, -1.609375, -1.486328125, -1.36328125, -1.240234375, -1.1171875, -0.994140625, -0.87109375, -0.748046875, -0.625, -0.501953125, -0.37890625, -0.255859375, -0.1328125, -0.009765625, 0.11328125, 0.236328125, 0.359375, 0.482421875, 0.60546875, 0.728515625, 0.8515625, 0.974609375, 1.09765625, 1.220703125, 1.34375, 1.466796875, 1.58984375, 1.712890625, 1.8359375, 1.958984375, 2.08203125, 2.205078125, 2.328125, 2.451171875, 2.57421875, 2.697265625, 2.8203125, 2.943359375, 3.06640625, 3.189453125, 3.3125, 3.435546875, 3.55859375, 3.681640625, 3.8046875, 3.927734375, 4.05078125, 4.173828125, 4.296875, 4.419921875, 4.54296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 1.0, 12.0, 10.0, 18.0, 22.0, 48.0, 74.0, 104.0, 220.0, 431.0, 1301.0, 11208.0, 1014973.0, 17526.0, 1597.0, 457.0, 220.0, 130.0, 68.0, 41.0, 23.0, 14.0, 11.0, 7.0, 7.0, 3.0, 8.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1341552734375, -0.1294574737548828, -0.12475967407226562, -0.12006187438964844, -0.11536407470703125, -0.11066627502441406, -0.10596847534179688, -0.10127067565917969, -0.0965728759765625, -0.09187507629394531, -0.08717727661132812, -0.08247947692871094, -0.07778167724609375, -0.07308387756347656, -0.06838607788085938, -0.06368827819824219, -0.058990478515625, -0.05429267883300781, -0.049594879150390625, -0.04489707946777344, -0.04019927978515625, -0.03550148010253906, -0.030803680419921875, -0.026105880737304688, -0.0214080810546875, -0.016710281372070312, -0.012012481689453125, -0.0073146820068359375, -0.00261688232421875, 0.0020809173583984375, 0.006778717041015625, 0.011476516723632812, 0.01617431640625, 0.020872116088867188, 0.025569915771484375, 0.030267715454101562, 0.03496551513671875, 0.03966331481933594, 0.044361114501953125, 0.04905891418457031, 0.0537567138671875, 0.05845451354980469, 0.06315231323242188, 0.06785011291503906, 0.07254791259765625, 0.07724571228027344, 0.08194351196289062, 0.08664131164550781, 0.091339111328125, 0.09603691101074219, 0.10073471069335938, 0.10543251037597656, 0.11013031005859375, 0.11482810974121094, 0.11952590942382812, 0.12422370910644531, 0.1289215087890625, 0.1336193084716797, 0.13831710815429688, 0.14301490783691406, 0.14771270751953125, 0.15241050720214844, 0.15710830688476562, 0.1618061065673828, 0.16650390625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 4.0, 4.0, 4.0, 9.0, 17.0, 12.0, 24.0, 30.0, 44.0, 54.0, 75.0, 84.0, 65.0, 94.0, 80.0, 82.0, 62.0, 70.0, 56.0, 32.0, 25.0, 15.0, 13.0, 10.0, 4.0, 9.0, 5.0, 4.0, 3.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.1054019927978516e-05, -3.0104070901870728e-05, -2.915412187576294e-05, -2.820417284965515e-05, -2.7254223823547363e-05, -2.6304274797439575e-05, -2.5354325771331787e-05, -2.4404376745224e-05, -2.345442771911621e-05, -2.2504478693008423e-05, -2.1554529666900635e-05, -2.0604580640792847e-05, -1.965463161468506e-05, -1.870468258857727e-05, -1.7754733562469482e-05, -1.6804784536361694e-05, -1.5854835510253906e-05, -1.4904886484146118e-05, -1.395493745803833e-05, -1.3004988431930542e-05, -1.2055039405822754e-05, -1.1105090379714966e-05, -1.0155141353607178e-05, -9.20519232749939e-06, -8.255243301391602e-06, -7.3052942752838135e-06, -6.355345249176025e-06, -5.405396223068237e-06, -4.455447196960449e-06, -3.505498170852661e-06, -2.555549144744873e-06, -1.605600118637085e-06, -6.556510925292969e-07, 2.942979335784912e-07, 1.2442469596862793e-06, 2.1941959857940674e-06, 3.1441450119018555e-06, 4.0940940380096436e-06, 5.044043064117432e-06, 5.99399209022522e-06, 6.943941116333008e-06, 7.893890142440796e-06, 8.843839168548584e-06, 9.793788194656372e-06, 1.074373722076416e-05, 1.1693686246871948e-05, 1.2643635272979736e-05, 1.3593584299087524e-05, 1.4543533325195312e-05, 1.54934823513031e-05, 1.644343137741089e-05, 1.7393380403518677e-05, 1.8343329429626465e-05, 1.9293278455734253e-05, 2.024322748184204e-05, 2.119317650794983e-05, 2.2143125534057617e-05, 2.3093074560165405e-05, 2.4043023586273193e-05, 2.499297261238098e-05, 2.594292163848877e-05, 2.6892870664596558e-05, 2.7842819690704346e-05, 2.8792768716812134e-05, 2.9742717742919922e-05]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 4.0, 1.0, 6.0, 3.0, 2.0, 10.0, 13.0, 23.0, 30.0, 74.0, 189.0, 1136.0, 865146.0, 180771.0, 830.0, 138.0, 55.0, 37.0, 23.0, 12.0, 13.0, 4.0, 5.0, 11.0, 2.0, 5.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.64013671875, -0.6232643127441406, -0.6063919067382812, -0.5895195007324219, -0.5726470947265625, -0.5557746887207031, -0.5389022827148438, -0.5220298767089844, -0.505157470703125, -0.4882850646972656, -0.47141265869140625, -0.4545402526855469, -0.4376678466796875, -0.4207954406738281, -0.40392303466796875, -0.3870506286621094, -0.37017822265625, -0.3533058166503906, -0.33643341064453125, -0.3195610046386719, -0.3026885986328125, -0.2858161926269531, -0.26894378662109375, -0.2520713806152344, -0.235198974609375, -0.21832656860351562, -0.20145416259765625, -0.18458175659179688, -0.1677093505859375, -0.15083694458007812, -0.13396453857421875, -0.11709213256835938, -0.1002197265625, -0.08334732055664062, -0.06647491455078125, -0.049602508544921875, -0.0327301025390625, -0.015857696533203125, 0.00101470947265625, 0.017887115478515625, 0.034759521484375, 0.051631927490234375, 0.06850433349609375, 0.08537673950195312, 0.1022491455078125, 0.11912155151367188, 0.13599395751953125, 0.15286636352539062, 0.16973876953125, 0.18661117553710938, 0.20348358154296875, 0.22035598754882812, 0.2372283935546875, 0.2541007995605469, 0.27097320556640625, 0.2878456115722656, 0.304718017578125, 0.3215904235839844, 0.33846282958984375, 0.3553352355957031, 0.3722076416015625, 0.3890800476074219, 0.40595245361328125, 0.4228248596191406, 0.439697265625]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 7.0, 2.0, 5.0, 4.0, 1.0, 9.0, 15.0, 12.0, 24.0, 38.0, 65.0, 85.0, 186.0, 201.0, 135.0, 54.0, 43.0, 26.0, 27.0, 11.0, 11.0, 7.0, 5.0, 11.0, 5.0, 3.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.039794921875, -0.0386965274810791, -0.0375981330871582, -0.036499738693237305, -0.035401344299316406, -0.03430294990539551, -0.03320455551147461, -0.03210616111755371, -0.031007766723632812, -0.029909372329711914, -0.028810977935791016, -0.027712583541870117, -0.02661418914794922, -0.02551579475402832, -0.024417400360107422, -0.023319005966186523, -0.022220611572265625, -0.021122217178344727, -0.020023822784423828, -0.01892542839050293, -0.01782703399658203, -0.016728639602661133, -0.015630245208740234, -0.014531850814819336, -0.013433456420898438, -0.012335062026977539, -0.01123666763305664, -0.010138273239135742, -0.009039878845214844, -0.007941484451293945, -0.006843090057373047, -0.0057446956634521484, -0.00464630126953125, -0.0035479068756103516, -0.002449512481689453, -0.0013511180877685547, -0.00025272369384765625, 0.0008456707000732422, 0.0019440650939941406, 0.003042459487915039, 0.0041408538818359375, 0.005239248275756836, 0.006337642669677734, 0.007436037063598633, 0.008534431457519531, 0.00963282585144043, 0.010731220245361328, 0.011829614639282227, 0.012928009033203125, 0.014026403427124023, 0.015124797821044922, 0.01622319221496582, 0.01732158660888672, 0.018419981002807617, 0.019518375396728516, 0.020616769790649414, 0.021715164184570312, 0.02281355857849121, 0.02391195297241211, 0.025010347366333008, 0.026108741760253906, 0.027207136154174805, 0.028305530548095703, 0.0294039249420166, 0.0305023193359375]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 12.0, 7.0, 50.0, 171.0, 341.0, 274.0, 94.0, 30.0, 14.0, 7.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.264389991760254, -12.961758613586426, -12.659126281738281, -12.356494903564453, -12.053863525390625, -11.75123119354248, -11.448599815368652, -11.145967483520508, -10.84333610534668, -10.540704727172852, -10.238072395324707, -9.935441017150879, -9.632808685302734, -9.330177307128906, -9.027545928955078, -8.72491455078125, -8.422282218933105, -8.119650840759277, -7.817018508911133, -7.514387130737305, -7.211755275726318, -6.909123420715332, -6.606492042541504, -6.303860187530518, -6.001228332519531, -5.698596477508545, -5.395964622497559, -5.0933332443237305, -4.790701389312744, -4.488069534301758, -4.18543815612793, -3.8828063011169434, -3.580173969268799, -3.2775421142578125, -2.9749104976654053, -2.672278881072998, -2.3696470260620117, -2.0670151710510254, -1.7643835544586182, -1.461751937866211, -1.1591200828552246, -0.8564883470535278, -0.553856611251831, -0.2512248754501343, 0.0514068603515625, 0.3540385961532593, 0.656670331954956, 0.9593019485473633, 1.2619338035583496, 1.5645655393600464, 1.8671972751617432, 2.1698288917541504, 2.4724607467651367, 2.775092601776123, 3.0777242183685303, 3.3803558349609375, 3.682987689971924, 3.98561954498291, 4.288250923156738, 4.590882778167725, 4.893514633178711, 5.196146488189697, 5.498778343200684, 5.801409721374512, 6.104041576385498]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 2.0, 3.0, 11.0, 16.0, 16.0, 14.0, 38.0, 33.0, 29.0, 33.0, 42.0, 57.0, 46.0, 50.0, 43.0, 49.0, 55.0, 58.0, 37.0, 52.0, 42.0, 48.0, 45.0, 34.0, 37.0, 24.0, 21.0, 20.0, 8.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.880835771560669, -1.813689947128296, -1.7465442419052124, -1.6793984174728394, -1.6122527122497559, -1.5451068878173828, -1.4779610633850098, -1.4108152389526367, -1.3436695337295532, -1.2765237092971802, -1.2093780040740967, -1.1422321796417236, -1.0750863552093506, -1.007940649986267, -0.940794825553894, -0.8736490607261658, -0.8065032958984375, -0.7393575310707092, -0.672211766242981, -0.6050659418106079, -0.5379201769828796, -0.47077441215515137, -0.4036286175251007, -0.33648282289505005, -0.2693370580673218, -0.2021912783384323, -0.13504549860954285, -0.06789971888065338, -0.000753939151763916, 0.06639182567596436, 0.13353762030601501, 0.20068341493606567, 0.26782894134521484, 0.3349747061729431, 0.4021205008029938, 0.46926629543304443, 0.5364120602607727, 0.603557825088501, 0.670703649520874, 0.7378494143486023, 0.8049951791763306, 0.8721409440040588, 0.9392867088317871, 1.0064325332641602, 1.0735783576965332, 1.1407240629196167, 1.2078698873519897, 1.2750155925750732, 1.3421614170074463, 1.4093072414398193, 1.4764529466629028, 1.5435987710952759, 1.6107444763183594, 1.6778903007507324, 1.7450361251831055, 1.8121819496154785, 1.879327654838562, 1.946473479270935, 2.0136191844940186, 2.0807650089263916, 2.1479108333587646, 2.2150564193725586, 2.2822022438049316, 2.3493480682373047, 2.4164938926696777]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 11.0, 6.0, 14.0, 8.0, 30.0, 44.0, 59.0, 89.0, 151.0, 305.0, 498.0, 928.0, 1760.0, 3359.0, 7088.0, 17495.0, 61316.0, 291386.0, 488149.0, 125693.0, 29619.0, 10673.0, 4759.0, 2363.0, 1214.0, 626.0, 347.0, 213.0, 132.0, 76.0, 50.0, 30.0, 21.0, 19.0, 7.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.47265625, -1.425506591796875, -1.37835693359375, -1.331207275390625, -1.2840576171875, -1.236907958984375, -1.18975830078125, -1.142608642578125, -1.095458984375, -1.048309326171875, -1.00115966796875, -0.954010009765625, -0.9068603515625, -0.859710693359375, -0.81256103515625, -0.765411376953125, -0.71826171875, -0.671112060546875, -0.62396240234375, -0.576812744140625, -0.5296630859375, -0.482513427734375, -0.43536376953125, -0.388214111328125, -0.341064453125, -0.293914794921875, -0.24676513671875, -0.199615478515625, -0.1524658203125, -0.105316162109375, -0.05816650390625, -0.011016845703125, 0.0361328125, 0.083282470703125, 0.13043212890625, 0.177581787109375, 0.2247314453125, 0.271881103515625, 0.31903076171875, 0.366180419921875, 0.413330078125, 0.460479736328125, 0.50762939453125, 0.554779052734375, 0.6019287109375, 0.649078369140625, 0.69622802734375, 0.743377685546875, 0.79052734375, 0.837677001953125, 0.88482666015625, 0.931976318359375, 0.9791259765625, 1.026275634765625, 1.07342529296875, 1.120574951171875, 1.167724609375, 1.214874267578125, 1.26202392578125, 1.309173583984375, 1.3563232421875, 1.403472900390625, 1.45062255859375, 1.497772216796875, 1.544921875]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 5.0, 8.0, 10.0, 15.0, 24.0, 39.0, 54.0, 56.0, 62.0, 71.0, 64.0, 72.0, 92.0, 83.0, 81.0, 57.0, 55.0, 50.0, 29.0, 20.0, 19.0, 14.0, 8.0, 10.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6171875, -9.2325439453125, -8.847900390625, -8.4632568359375, -8.07861328125, -7.6939697265625, -7.309326171875, -6.9246826171875, -6.5400390625, -6.1553955078125, -5.770751953125, -5.3861083984375, -5.00146484375, -4.6168212890625, -4.232177734375, -3.8475341796875, -3.462890625, -3.0782470703125, -2.693603515625, -2.3089599609375, -1.92431640625, -1.5396728515625, -1.155029296875, -0.7703857421875, -0.3857421875, -0.0010986328125, 0.383544921875, 0.7681884765625, 1.15283203125, 1.5374755859375, 1.922119140625, 2.3067626953125, 2.69140625, 3.0760498046875, 3.460693359375, 3.8453369140625, 4.22998046875, 4.6146240234375, 4.999267578125, 5.3839111328125, 5.7685546875, 6.1531982421875, 6.537841796875, 6.9224853515625, 7.30712890625, 7.6917724609375, 8.076416015625, 8.4610595703125, 8.845703125, 9.2303466796875, 9.614990234375, 9.9996337890625, 10.38427734375, 10.7689208984375, 11.153564453125, 11.5382080078125, 11.9228515625, 12.3074951171875, 12.692138671875, 13.0767822265625, 13.46142578125, 13.8460693359375, 14.230712890625, 14.6153564453125, 15.0]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 6.0, 2.0, 6.0, 12.0, 16.0, 20.0, 23.0, 31.0, 44.0, 77.0, 100.0, 236.0, 717.0, 24768.0, 1019443.0, 2207.0, 353.0, 160.0, 108.0, 50.0, 54.0, 27.0, 21.0, 22.0, 18.0, 10.0, 3.0, 6.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6953125, -12.26123046875, -11.8271484375, -11.39306640625, -10.958984375, -10.52490234375, -10.0908203125, -9.65673828125, -9.22265625, -8.78857421875, -8.3544921875, -7.92041015625, -7.486328125, -7.05224609375, -6.6181640625, -6.18408203125, -5.75, -5.31591796875, -4.8818359375, -4.44775390625, -4.013671875, -3.57958984375, -3.1455078125, -2.71142578125, -2.27734375, -1.84326171875, -1.4091796875, -0.97509765625, -0.541015625, -0.10693359375, 0.3271484375, 0.76123046875, 1.1953125, 1.62939453125, 2.0634765625, 2.49755859375, 2.931640625, 3.36572265625, 3.7998046875, 4.23388671875, 4.66796875, 5.10205078125, 5.5361328125, 5.97021484375, 6.404296875, 6.83837890625, 7.2724609375, 7.70654296875, 8.140625, 8.57470703125, 9.0087890625, 9.44287109375, 9.876953125, 10.31103515625, 10.7451171875, 11.17919921875, 11.61328125, 12.04736328125, 12.4814453125, 12.91552734375, 13.349609375, 13.78369140625, 14.2177734375, 14.65185546875, 15.0859375]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 8.0, 9.0, 8.0, 15.0, 16.0, 33.0, 27.0, 56.0, 52.0, 63.0, 78.0, 69.0, 97.0, 71.0, 79.0, 70.0, 55.0, 61.0, 31.0, 25.0, 17.0, 22.0, 13.0, 10.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.515625, -10.13232421875, -9.7490234375, -9.36572265625, -8.982421875, -8.59912109375, -8.2158203125, -7.83251953125, -7.44921875, -7.06591796875, -6.6826171875, -6.29931640625, -5.916015625, -5.53271484375, -5.1494140625, -4.76611328125, -4.3828125, -3.99951171875, -3.6162109375, -3.23291015625, -2.849609375, -2.46630859375, -2.0830078125, -1.69970703125, -1.31640625, -0.93310546875, -0.5498046875, -0.16650390625, 0.216796875, 0.60009765625, 0.9833984375, 1.36669921875, 1.75, 2.13330078125, 2.5166015625, 2.89990234375, 3.283203125, 3.66650390625, 4.0498046875, 4.43310546875, 4.81640625, 5.19970703125, 5.5830078125, 5.96630859375, 6.349609375, 6.73291015625, 7.1162109375, 7.49951171875, 7.8828125, 8.26611328125, 8.6494140625, 9.03271484375, 9.416015625, 9.79931640625, 10.1826171875, 10.56591796875, 10.94921875, 11.33251953125, 11.7158203125, 12.09912109375, 12.482421875, 12.86572265625, 13.2490234375, 13.63232421875, 14.015625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 6.0, 13.0, 8.0, 18.0, 29.0, 54.0, 124.0, 293.0, 972.0, 4341.0, 39233.0, 958648.0, 38984.0, 4280.0, 976.0, 318.0, 119.0, 67.0, 42.0, 5.0, 10.0, 5.0, 5.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2119140625, -1.1757354736328125, -1.139556884765625, -1.1033782958984375, -1.06719970703125, -1.0310211181640625, -0.994842529296875, -0.9586639404296875, -0.9224853515625, -0.8863067626953125, -0.850128173828125, -0.8139495849609375, -0.77777099609375, -0.7415924072265625, -0.705413818359375, -0.6692352294921875, -0.633056640625, -0.5968780517578125, -0.560699462890625, -0.5245208740234375, -0.48834228515625, -0.4521636962890625, -0.415985107421875, -0.3798065185546875, -0.3436279296875, -0.3074493408203125, -0.271270751953125, -0.2350921630859375, -0.19891357421875, -0.1627349853515625, -0.126556396484375, -0.0903778076171875, -0.05419921875, -0.0180206298828125, 0.018157958984375, 0.0543365478515625, 0.09051513671875, 0.1266937255859375, 0.162872314453125, 0.1990509033203125, 0.2352294921875, 0.2714080810546875, 0.307586669921875, 0.3437652587890625, 0.37994384765625, 0.4161224365234375, 0.452301025390625, 0.4884796142578125, 0.524658203125, 0.5608367919921875, 0.597015380859375, 0.6331939697265625, 0.66937255859375, 0.7055511474609375, 0.741729736328125, 0.7779083251953125, 0.8140869140625, 0.8502655029296875, 0.886444091796875, 0.9226226806640625, 0.95880126953125, 0.9949798583984375, 1.031158447265625, 1.0673370361328125, 1.103515625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 3.0, 6.0, 5.0, 13.0, 21.0, 36.0, 67.0, 111.0, 331.0, 211.0, 74.0, 46.0, 22.0, 14.0, 14.0, 6.0, 5.0, 5.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018167495727539062, -0.00017672404646873474, -0.00017177313566207886, -0.00016682222485542297, -0.0001618713140487671, -0.0001569204032421112, -0.00015196949243545532, -0.00014701858162879944, -0.00014206767082214355, -0.00013711676001548767, -0.0001321658492088318, -0.0001272149384021759, -0.00012226402759552002, -0.00011731311678886414, -0.00011236220598220825, -0.00010741129517555237, -0.00010246038436889648, -9.75094735622406e-05, -9.255856275558472e-05, -8.760765194892883e-05, -8.265674114227295e-05, -7.770583033561707e-05, -7.275491952896118e-05, -6.78040087223053e-05, -6.285309791564941e-05, -5.790218710899353e-05, -5.2951276302337646e-05, -4.800036549568176e-05, -4.304945468902588e-05, -3.8098543882369995e-05, -3.314763307571411e-05, -2.8196722269058228e-05, -2.3245811462402344e-05, -1.829490065574646e-05, -1.3343989849090576e-05, -8.393079042434692e-06, -3.4421682357788086e-06, 1.5087425708770752e-06, 6.459653377532959e-06, 1.1410564184188843e-05, 1.6361474990844727e-05, 2.131238579750061e-05, 2.6263296604156494e-05, 3.121420741081238e-05, 3.616511821746826e-05, 4.1116029024124146e-05, 4.606693983078003e-05, 5.101785063743591e-05, 5.59687614440918e-05, 6.091967225074768e-05, 6.587058305740356e-05, 7.082149386405945e-05, 7.577240467071533e-05, 8.072331547737122e-05, 8.56742262840271e-05, 9.062513709068298e-05, 9.557604789733887e-05, 0.00010052695870399475, 0.00010547786951065063, 0.00011042878031730652, 0.0001153796911239624, 0.00012033060193061829, 0.00012528151273727417, 0.00013023242354393005, 0.00013518333435058594]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 4.0, 13.0, 10.0, 10.0, 18.0, 18.0, 27.0, 66.0, 112.0, 234.0, 630.0, 2214.0, 12797.0, 671016.0, 346361.0, 11746.0, 2154.0, 633.0, 194.0, 97.0, 65.0, 30.0, 18.0, 21.0, 16.0, 7.0, 3.0, 5.0, 4.0, 3.0, 6.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-1.0673828125, -1.032928466796875, -0.99847412109375, -0.964019775390625, -0.9295654296875, -0.895111083984375, -0.86065673828125, -0.826202392578125, -0.791748046875, -0.757293701171875, -0.72283935546875, -0.688385009765625, -0.6539306640625, -0.619476318359375, -0.58502197265625, -0.550567626953125, -0.51611328125, -0.481658935546875, -0.44720458984375, -0.412750244140625, -0.3782958984375, -0.343841552734375, -0.30938720703125, -0.274932861328125, -0.240478515625, -0.206024169921875, -0.17156982421875, -0.137115478515625, -0.1026611328125, -0.068206787109375, -0.03375244140625, 0.000701904296875, 0.03515625, 0.069610595703125, 0.10406494140625, 0.138519287109375, 0.1729736328125, 0.207427978515625, 0.24188232421875, 0.276336669921875, 0.310791015625, 0.345245361328125, 0.37969970703125, 0.414154052734375, 0.4486083984375, 0.483062744140625, 0.51751708984375, 0.551971435546875, 0.58642578125, 0.620880126953125, 0.65533447265625, 0.689788818359375, 0.7242431640625, 0.758697509765625, 0.79315185546875, 0.827606201171875, 0.862060546875, 0.896514892578125, 0.93096923828125, 0.965423583984375, 0.9998779296875, 1.034332275390625, 1.06878662109375, 1.103240966796875, 1.1376953125]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 5.0, 6.0, 11.0, 13.0, 15.0, 11.0, 12.0, 25.0, 27.0, 47.0, 61.0, 88.0, 343.0, 87.0, 60.0, 49.0, 30.0, 16.0, 13.0, 11.0, 18.0, 14.0, 6.0, 8.0, 2.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19482421875, -0.1877593994140625, -0.180694580078125, -0.1736297607421875, -0.16656494140625, -0.1595001220703125, -0.152435302734375, -0.1453704833984375, -0.1383056640625, -0.1312408447265625, -0.124176025390625, -0.1171112060546875, -0.11004638671875, -0.1029815673828125, -0.095916748046875, -0.0888519287109375, -0.081787109375, -0.0747222900390625, -0.067657470703125, -0.0605926513671875, -0.05352783203125, -0.0464630126953125, -0.039398193359375, -0.0323333740234375, -0.0252685546875, -0.0182037353515625, -0.011138916015625, -0.0040740966796875, 0.00299072265625, 0.0100555419921875, 0.017120361328125, 0.0241851806640625, 0.03125, 0.0383148193359375, 0.045379638671875, 0.0524444580078125, 0.05950927734375, 0.0665740966796875, 0.073638916015625, 0.0807037353515625, 0.0877685546875, 0.0948333740234375, 0.101898193359375, 0.1089630126953125, 0.11602783203125, 0.1230926513671875, 0.130157470703125, 0.1372222900390625, 0.144287109375, 0.1513519287109375, 0.158416748046875, 0.1654815673828125, 0.17254638671875, 0.1796112060546875, 0.186676025390625, 0.1937408447265625, 0.2008056640625, 0.2078704833984375, 0.214935302734375, 0.2220001220703125, 0.22906494140625, 0.2361297607421875, 0.243194580078125, 0.2502593994140625, 0.25732421875]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 5.0, 70.0, 491.0, 376.0, 53.0, 15.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-50.29172134399414, -49.37619400024414, -48.46066665649414, -47.54513931274414, -46.629615783691406, -45.714088439941406, -44.798561096191406, -43.883033752441406, -42.967506408691406, -42.051979064941406, -41.136451721191406, -40.220924377441406, -39.30540084838867, -38.38987350463867, -37.47434616088867, -36.55881881713867, -35.64329147338867, -34.72776412963867, -33.81223678588867, -32.89670944213867, -31.981184005737305, -31.065658569335938, -30.150131225585938, -29.234603881835938, -28.31907844543457, -27.40355110168457, -26.488025665283203, -25.572498321533203, -24.656970977783203, -23.741443634033203, -22.825918197631836, -21.910390853881836, -20.99486541748047, -20.07933807373047, -19.1638126373291, -18.2482852935791, -17.3327579498291, -16.417232513427734, -15.501705169677734, -14.586177825927734, -13.670650482177734, -12.75512409210205, -11.83959674835205, -10.924070358276367, -10.008543014526367, -9.093016624450684, -8.177490234375, -7.261962890625, -6.346435546875, -5.430908679962158, -4.515381813049316, -3.5998551845550537, -2.684328317642212, -1.7688016891479492, -0.8532748222351074, 0.062252044677734375, 0.9777789115905762, 1.893305778503418, 2.8088326454162598, 3.7243592739105225, 4.639885902404785, 5.555412769317627, 6.470939636230469, 7.3864665031433105, 8.301993370056152]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 5.0, 9.0, 5.0, 12.0, 7.0, 6.0, 12.0, 19.0, 10.0, 29.0, 21.0, 26.0, 21.0, 23.0, 29.0, 27.0, 32.0, 34.0, 48.0, 39.0, 32.0, 45.0, 35.0, 49.0, 45.0, 42.0, 35.0, 31.0, 24.0, 35.0, 27.0, 21.0, 24.0, 26.0, 21.0, 15.0, 17.0, 11.0, 7.0, 8.0, 11.0, 6.0, 4.0, 7.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-9.610380172729492, -9.327811241149902, -9.045243263244629, -8.762674331665039, -8.48010540008545, -8.19753646850586, -7.914968490600586, -7.632399559020996, -7.3498311042785645, -7.067262649536133, -6.784693717956543, -6.502125263214111, -6.21955680847168, -5.93698787689209, -5.654419422149658, -5.371850967407227, -5.089282035827637, -4.806713581085205, -4.524144649505615, -4.241576194763184, -3.959007501602173, -3.676438808441162, -3.3938703536987305, -3.1113016605377197, -2.828732967376709, -2.5461642742156982, -2.2635955810546875, -1.9810271263122559, -1.6984584331512451, -1.4158897399902344, -1.1333211660385132, -0.850752592086792, -0.5681829452514648, -0.2856143116950989, -0.00304567813873291, 0.27952295541763306, 0.562091588973999, 0.8446602821350098, 1.127228856086731, 1.4097974300384521, 1.692366123199463, 1.9749348163604736, 2.2575035095214844, 2.540071964263916, 2.8226406574249268, 3.1052093505859375, 3.387777805328369, 3.67034649848938, 3.9529151916503906, 4.235483646392822, 4.518052577972412, 4.800621032714844, 5.083189964294434, 5.365758419036865, 5.648326873779297, 5.930895805358887, 6.213464260101318, 6.49603271484375, 6.77860164642334, 7.0611701011657715, 7.343738555908203, 7.626307487487793, 7.908875942230225, 8.191444396972656, 8.474013328552246]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 5.0, 9.0, 11.0, 16.0, 21.0, 37.0, 51.0, 80.0, 121.0, 208.0, 474.0, 1400.0, 5452.0, 28731.0, 375639.0, 3621025.0, 138828.0, 16768.0, 3492.0, 1038.0, 381.0, 182.0, 114.0, 56.0, 49.0, 27.0, 23.0, 16.0, 10.0, 8.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.94921875, -4.81304931640625, -4.6768798828125, -4.54071044921875, -4.404541015625, -4.26837158203125, -4.1322021484375, -3.99603271484375, -3.85986328125, -3.72369384765625, -3.5875244140625, -3.45135498046875, -3.315185546875, -3.17901611328125, -3.0428466796875, -2.90667724609375, -2.7705078125, -2.63433837890625, -2.4981689453125, -2.36199951171875, -2.225830078125, -2.08966064453125, -1.9534912109375, -1.81732177734375, -1.68115234375, -1.54498291015625, -1.4088134765625, -1.27264404296875, -1.136474609375, -1.00030517578125, -0.8641357421875, -0.72796630859375, -0.591796875, -0.45562744140625, -0.3194580078125, -0.18328857421875, -0.047119140625, 0.08905029296875, 0.2252197265625, 0.36138916015625, 0.49755859375, 0.63372802734375, 0.7698974609375, 0.90606689453125, 1.042236328125, 1.17840576171875, 1.3145751953125, 1.45074462890625, 1.5869140625, 1.72308349609375, 1.8592529296875, 1.99542236328125, 2.131591796875, 2.26776123046875, 2.4039306640625, 2.54010009765625, 2.67626953125, 2.81243896484375, 2.9486083984375, 3.08477783203125, 3.220947265625, 3.35711669921875, 3.4932861328125, 3.62945556640625, 3.765625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 9.0, 5.0, 7.0, 10.0, 17.0, 9.0, 14.0, 13.0, 24.0, 24.0, 28.0, 25.0, 25.0, 36.0, 38.0, 41.0, 54.0, 52.0, 40.0, 40.0, 42.0, 36.0, 37.0, 31.0, 45.0, 37.0, 39.0, 30.0, 26.0, 28.0, 27.0, 29.0, 14.0, 8.0, 12.0, 12.0, 11.0, 6.0, 5.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.7255859375, -1.674560546875, -1.62353515625, -1.572509765625, -1.521484375, -1.470458984375, -1.41943359375, -1.368408203125, -1.3173828125, -1.266357421875, -1.21533203125, -1.164306640625, -1.11328125, -1.062255859375, -1.01123046875, -0.960205078125, -0.9091796875, -0.858154296875, -0.80712890625, -0.756103515625, -0.705078125, -0.654052734375, -0.60302734375, -0.552001953125, -0.5009765625, -0.449951171875, -0.39892578125, -0.347900390625, -0.296875, -0.245849609375, -0.19482421875, -0.143798828125, -0.0927734375, -0.041748046875, 0.00927734375, 0.060302734375, 0.111328125, 0.162353515625, 0.21337890625, 0.264404296875, 0.3154296875, 0.366455078125, 0.41748046875, 0.468505859375, 0.51953125, 0.570556640625, 0.62158203125, 0.672607421875, 0.7236328125, 0.774658203125, 0.82568359375, 0.876708984375, 0.927734375, 0.978759765625, 1.02978515625, 1.080810546875, 1.1318359375, 1.182861328125, 1.23388671875, 1.284912109375, 1.3359375, 1.386962890625, 1.43798828125, 1.489013671875, 1.5400390625]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 8.0, 15.0, 16.0, 31.0, 78.0, 313.0, 47126.0, 4146125.0, 377.0, 111.0, 52.0, 12.0, 9.0, 4.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.21875, -41.8720703125, -40.525390625, -39.1787109375, -37.83203125, -36.4853515625, -35.138671875, -33.7919921875, -32.4453125, -31.0986328125, -29.751953125, -28.4052734375, -27.05859375, -25.7119140625, -24.365234375, -23.0185546875, -21.671875, -20.3251953125, -18.978515625, -17.6318359375, -16.28515625, -14.9384765625, -13.591796875, -12.2451171875, -10.8984375, -9.5517578125, -8.205078125, -6.8583984375, -5.51171875, -4.1650390625, -2.818359375, -1.4716796875, -0.125, 1.2216796875, 2.568359375, 3.9150390625, 5.26171875, 6.6083984375, 7.955078125, 9.3017578125, 10.6484375, 11.9951171875, 13.341796875, 14.6884765625, 16.03515625, 17.3818359375, 18.728515625, 20.0751953125, 21.421875, 22.7685546875, 24.115234375, 25.4619140625, 26.80859375, 28.1552734375, 29.501953125, 30.8486328125, 32.1953125, 33.5419921875, 34.888671875, 36.2353515625, 37.58203125, 38.9287109375, 40.275390625, 41.6220703125, 42.96875]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 6.0, 9.0, 3.0, 6.0, 10.0, 20.0, 17.0, 40.0, 44.0, 79.0, 133.0, 186.0, 368.0, 952.0, 1139.0, 462.0, 204.0, 121.0, 96.0, 57.0, 35.0, 26.0, 17.0, 16.0, 8.0, 5.0, 5.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.88232421875, -0.8556671142578125, -0.829010009765625, -0.8023529052734375, -0.77569580078125, -0.7490386962890625, -0.722381591796875, -0.6957244873046875, -0.6690673828125, -0.6424102783203125, -0.615753173828125, -0.5890960693359375, -0.56243896484375, -0.5357818603515625, -0.509124755859375, -0.4824676513671875, -0.455810546875, -0.4291534423828125, -0.402496337890625, -0.3758392333984375, -0.34918212890625, -0.3225250244140625, -0.295867919921875, -0.2692108154296875, -0.2425537109375, -0.2158966064453125, -0.189239501953125, -0.1625823974609375, -0.13592529296875, -0.1092681884765625, -0.082611083984375, -0.0559539794921875, -0.029296875, -0.0026397705078125, 0.024017333984375, 0.0506744384765625, 0.07733154296875, 0.1039886474609375, 0.130645751953125, 0.1573028564453125, 0.1839599609375, 0.2106170654296875, 0.237274169921875, 0.2639312744140625, 0.29058837890625, 0.3172454833984375, 0.343902587890625, 0.3705596923828125, 0.397216796875, 0.4238739013671875, 0.450531005859375, 0.4771881103515625, 0.50384521484375, 0.5305023193359375, 0.557159423828125, 0.5838165283203125, 0.6104736328125, 0.6371307373046875, 0.663787841796875, 0.6904449462890625, 0.71710205078125, 0.7437591552734375, 0.770416259765625, 0.7970733642578125, 0.82373046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 14.0, 16.0, 82.0, 246.0, 376.0, 190.0, 48.0, 16.0, 6.0, 10.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-17.284709930419922, -16.941699981689453, -16.598691940307617, -16.25568199157715, -15.912673950195312, -15.56966495513916, -15.226655960083008, -14.883646011352539, -14.540637969970703, -14.19762897491455, -13.854619979858398, -13.511610984802246, -13.168601989746094, -12.825592994689941, -12.482583999633789, -12.13957405090332, -11.796565055847168, -11.453556060791016, -11.110547065734863, -10.767538070678711, -10.424529075622559, -10.081520080566406, -9.738510131835938, -9.395502090454102, -9.052492141723633, -8.70948314666748, -8.366474151611328, -8.023465156555176, -7.680456161499023, -7.337447166442871, -6.9944376945495605, -6.651428699493408, -6.3084211349487305, -5.965412139892578, -5.622403144836426, -5.279394149780273, -4.936385154724121, -4.593376159667969, -4.250366687774658, -3.907357692718506, -3.5643486976623535, -3.221339702606201, -2.878330707550049, -2.5353214740753174, -2.192312479019165, -1.8493034839630127, -1.5062942504882812, -1.163285255432129, -0.8202762603759766, -0.47726720571517944, -0.13425815105438232, 0.20875096321105957, 0.5517599582672119, 0.8947689533233643, 1.2377781867980957, 1.580787181854248, 1.9237961769104004, 2.2668051719665527, 2.609814167022705, 2.9528234004974365, 3.295832395553589, 3.638841390609741, 3.9818506240844727, 4.324859619140625, 4.667868614196777]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 7.0, 12.0, 14.0, 17.0, 21.0, 15.0, 15.0, 30.0, 21.0, 35.0, 27.0, 33.0, 33.0, 32.0, 44.0, 32.0, 47.0, 43.0, 46.0, 45.0, 40.0, 48.0, 29.0, 25.0, 27.0, 38.0, 38.0, 24.0, 17.0, 31.0, 20.0, 18.0, 9.0, 12.0, 9.0, 11.0, 6.0, 8.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.8065723180770874, -1.7518330812454224, -1.6970938444137573, -1.6423547267913818, -1.5876154899597168, -1.5328762531280518, -1.4781370162963867, -1.4233977794647217, -1.3686585426330566, -1.3139193058013916, -1.2591800689697266, -1.2044408321380615, -1.149701714515686, -1.094962477684021, -1.040223240852356, -0.9854840040206909, -0.9307448863983154, -0.8760056495666504, -0.8212664723396301, -0.7665272355079651, -0.7117880582809448, -0.6570488214492798, -0.6023095846176147, -0.5475703477859497, -0.49283117055892944, -0.4380919635295868, -0.38335275650024414, -0.3286135196685791, -0.27387431263923645, -0.2191351056098938, -0.16439586877822876, -0.10965666174888611, -0.054917335510253906, -0.00017812103033065796, 0.05456109344959259, 0.10930031538009644, 0.1640395224094391, 0.21877872943878174, 0.2735179662704468, 0.32825717329978943, 0.3829963803291321, 0.43773558735847473, 0.4924747943878174, 0.5472140312194824, 0.6019532680511475, 0.6566924452781677, 0.7114316821098328, 0.766170859336853, 0.8209100961685181, 0.8756493330001831, 0.9303885102272034, 0.9851277470588684, 1.0398669242858887, 1.0946061611175537, 1.1493453979492188, 1.2040846347808838, 1.2588238716125488, 1.3135631084442139, 1.368302345275879, 1.423041582107544, 1.4777806997299194, 1.5325199365615845, 1.5872591733932495, 1.6419984102249146, 1.69673752784729]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 8.0, 12.0, 11.0, 10.0, 28.0, 43.0, 62.0, 75.0, 108.0, 148.0, 231.0, 351.0, 504.0, 787.0, 1185.0, 2220.0, 5506.0, 23307.0, 186925.0, 695014.0, 107119.0, 15576.0, 4244.0, 1810.0, 1121.0, 684.0, 463.0, 303.0, 194.0, 157.0, 107.0, 61.0, 54.0, 36.0, 17.0, 17.0, 16.0, 10.0, 6.0, 6.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-0.429931640625, -0.41811370849609375, -0.4062957763671875, -0.39447784423828125, -0.382659912109375, -0.37084197998046875, -0.3590240478515625, -0.34720611572265625, -0.33538818359375, -0.32357025146484375, -0.3117523193359375, -0.29993438720703125, -0.288116455078125, -0.27629852294921875, -0.2644805908203125, -0.25266265869140625, -0.2408447265625, -0.22902679443359375, -0.2172088623046875, -0.20539093017578125, -0.193572998046875, -0.18175506591796875, -0.1699371337890625, -0.15811920166015625, -0.14630126953125, -0.13448333740234375, -0.1226654052734375, -0.11084747314453125, -0.099029541015625, -0.08721160888671875, -0.0753936767578125, -0.06357574462890625, -0.0517578125, -0.03993988037109375, -0.0281219482421875, -0.01630401611328125, -0.004486083984375, 0.00733184814453125, 0.0191497802734375, 0.03096771240234375, 0.04278564453125, 0.05460357666015625, 0.0664215087890625, 0.07823944091796875, 0.090057373046875, 0.10187530517578125, 0.1136932373046875, 0.12551116943359375, 0.1373291015625, 0.14914703369140625, 0.1609649658203125, 0.17278289794921875, 0.184600830078125, 0.19641876220703125, 0.2082366943359375, 0.22005462646484375, 0.23187255859375, 0.24369049072265625, 0.2555084228515625, 0.26732635498046875, 0.279144287109375, 0.29096221923828125, 0.3027801513671875, 0.31459808349609375, 0.326416015625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 9.0, 3.0, 4.0, 10.0, 14.0, 20.0, 14.0, 18.0, 26.0, 22.0, 26.0, 41.0, 41.0, 32.0, 31.0, 52.0, 49.0, 39.0, 57.0, 42.0, 39.0, 53.0, 37.0, 48.0, 43.0, 25.0, 31.0, 26.0, 21.0, 24.0, 19.0, 18.0, 11.0, 10.0, 10.0, 11.0, 5.0, 8.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-1.4951171875, -1.453369140625, -1.41162109375, -1.369873046875, -1.328125, -1.286376953125, -1.24462890625, -1.202880859375, -1.1611328125, -1.119384765625, -1.07763671875, -1.035888671875, -0.994140625, -0.952392578125, -0.91064453125, -0.868896484375, -0.8271484375, -0.785400390625, -0.74365234375, -0.701904296875, -0.66015625, -0.618408203125, -0.57666015625, -0.534912109375, -0.4931640625, -0.451416015625, -0.40966796875, -0.367919921875, -0.326171875, -0.284423828125, -0.24267578125, -0.200927734375, -0.1591796875, -0.117431640625, -0.07568359375, -0.033935546875, 0.0078125, 0.049560546875, 0.09130859375, 0.133056640625, 0.1748046875, 0.216552734375, 0.25830078125, 0.300048828125, 0.341796875, 0.383544921875, 0.42529296875, 0.467041015625, 0.5087890625, 0.550537109375, 0.59228515625, 0.634033203125, 0.67578125, 0.717529296875, 0.75927734375, 0.801025390625, 0.8427734375, 0.884521484375, 0.92626953125, 0.968017578125, 1.009765625, 1.051513671875, 1.09326171875, 1.135009765625, 1.1767578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 11.0, 5.0, 13.0, 15.0, 21.0, 23.0, 22.0, 44.0, 48.0, 67.0, 74.0, 96.0, 125.0, 175.0, 208.0, 254.0, 364.0, 581.0, 1256.0, 5909.0, 54955.0, 591416.0, 355772.0, 30372.0, 3806.0, 951.0, 476.0, 341.0, 230.0, 189.0, 148.0, 123.0, 99.0, 73.0, 57.0, 42.0, 49.0, 28.0, 26.0, 19.0, 16.0, 9.0, 12.0, 12.0, 8.0, 8.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2177734375, -0.21072006225585938, -0.20366668701171875, -0.19661331176757812, -0.1895599365234375, -0.18250656127929688, -0.17545318603515625, -0.16839981079101562, -0.161346435546875, -0.15429306030273438, -0.14723968505859375, -0.14018630981445312, -0.1331329345703125, -0.12607955932617188, -0.11902618408203125, -0.11197280883789062, -0.10491943359375, -0.09786605834960938, -0.09081268310546875, -0.08375930786132812, -0.0767059326171875, -0.06965255737304688, -0.06259918212890625, -0.055545806884765625, -0.048492431640625, -0.041439056396484375, -0.03438568115234375, -0.027332305908203125, -0.0202789306640625, -0.013225555419921875, -0.00617218017578125, 0.000881195068359375, 0.0079345703125, 0.014987945556640625, 0.02204132080078125, 0.029094696044921875, 0.0361480712890625, 0.043201446533203125, 0.05025482177734375, 0.057308197021484375, 0.064361572265625, 0.07141494750976562, 0.07846832275390625, 0.08552169799804688, 0.0925750732421875, 0.09962844848632812, 0.10668182373046875, 0.11373519897460938, 0.12078857421875, 0.12784194946289062, 0.13489532470703125, 0.14194869995117188, 0.1490020751953125, 0.15605545043945312, 0.16310882568359375, 0.17016220092773438, 0.177215576171875, 0.18426895141601562, 0.19132232666015625, 0.19837570190429688, 0.2054290771484375, 0.21248245239257812, 0.21953582763671875, 0.22658920288085938, 0.233642578125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [4.0, 4.0, 2.0, 1.0, 1.0, 4.0, 1.0, 4.0, 2.0, 2.0, 7.0, 7.0, 11.0, 7.0, 12.0, 13.0, 16.0, 21.0, 15.0, 32.0, 17.0, 26.0, 32.0, 30.0, 41.0, 42.0, 32.0, 38.0, 39.0, 36.0, 45.0, 34.0, 41.0, 46.0, 32.0, 34.0, 33.0, 30.0, 22.0, 26.0, 24.0, 23.0, 20.0, 12.0, 14.0, 12.0, 15.0, 12.0, 9.0, 5.0, 3.0, 4.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.8564453125, -1.7955780029296875, -1.734710693359375, -1.6738433837890625, -1.61297607421875, -1.5521087646484375, -1.491241455078125, -1.4303741455078125, -1.3695068359375, -1.3086395263671875, -1.247772216796875, -1.1869049072265625, -1.12603759765625, -1.0651702880859375, -1.004302978515625, -0.9434356689453125, -0.882568359375, -0.8217010498046875, -0.760833740234375, -0.6999664306640625, -0.63909912109375, -0.5782318115234375, -0.517364501953125, -0.4564971923828125, -0.3956298828125, -0.3347625732421875, -0.273895263671875, -0.2130279541015625, -0.15216064453125, -0.0912933349609375, -0.030426025390625, 0.0304412841796875, 0.09130859375, 0.1521759033203125, 0.213043212890625, 0.2739105224609375, 0.33477783203125, 0.3956451416015625, 0.456512451171875, 0.5173797607421875, 0.5782470703125, 0.6391143798828125, 0.699981689453125, 0.7608489990234375, 0.82171630859375, 0.8825836181640625, 0.943450927734375, 1.0043182373046875, 1.065185546875, 1.1260528564453125, 1.186920166015625, 1.2477874755859375, 1.30865478515625, 1.3695220947265625, 1.430389404296875, 1.4912567138671875, 1.5521240234375, 1.6129913330078125, 1.673858642578125, 1.7347259521484375, 1.79559326171875, 1.8564605712890625, 1.917327880859375, 1.9781951904296875, 2.0390625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 5.0, 10.0, 17.0, 27.0, 29.0, 52.0, 88.0, 145.0, 262.0, 507.0, 1117.0, 8223.0, 988035.0, 46968.0, 1688.0, 647.0, 284.0, 180.0, 97.0, 72.0, 34.0, 25.0, 19.0, 8.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.039276123046875, -0.03768491744995117, -0.036093711853027344, -0.034502506256103516, -0.03291130065917969, -0.03132009506225586, -0.02972888946533203, -0.028137683868408203, -0.026546478271484375, -0.024955272674560547, -0.02336406707763672, -0.02177286148071289, -0.020181655883789062, -0.018590450286865234, -0.016999244689941406, -0.015408039093017578, -0.01381683349609375, -0.012225627899169922, -0.010634422302246094, -0.009043216705322266, -0.0074520111083984375, -0.005860805511474609, -0.004269599914550781, -0.002678394317626953, -0.001087188720703125, 0.0005040168762207031, 0.0020952224731445312, 0.0036864280700683594, 0.0052776336669921875, 0.006868839263916016, 0.008460044860839844, 0.010051250457763672, 0.0116424560546875, 0.013233661651611328, 0.014824867248535156, 0.016416072845458984, 0.018007278442382812, 0.01959848403930664, 0.02118968963623047, 0.022780895233154297, 0.024372100830078125, 0.025963306427001953, 0.02755451202392578, 0.02914571762084961, 0.030736923217773438, 0.032328128814697266, 0.033919334411621094, 0.03551054000854492, 0.03710174560546875, 0.03869295120239258, 0.040284156799316406, 0.041875362396240234, 0.04346656799316406, 0.04505777359008789, 0.04664897918701172, 0.04824018478393555, 0.049831390380859375, 0.0514225959777832, 0.05301380157470703, 0.05460500717163086, 0.05619621276855469, 0.057787418365478516, 0.059378623962402344, 0.06096982955932617, 0.06256103515625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 10.0, 21.0, 32.0, 24.0, 52.0, 61.0, 97.0, 95.0, 110.0, 117.0, 94.0, 67.0, 60.0, 42.0, 38.0, 12.0, 12.0, 4.0, 12.0, 8.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.008676528930664e-05, -1.9341707229614258e-05, -1.8596649169921875e-05, -1.7851591110229492e-05, -1.710653305053711e-05, -1.6361474990844727e-05, -1.5616416931152344e-05, -1.4871358871459961e-05, -1.4126300811767578e-05, -1.3381242752075195e-05, -1.2636184692382812e-05, -1.189112663269043e-05, -1.1146068572998047e-05, -1.0401010513305664e-05, -9.655952453613281e-06, -8.910894393920898e-06, -8.165836334228516e-06, -7.420778274536133e-06, -6.67572021484375e-06, -5.930662155151367e-06, -5.185604095458984e-06, -4.4405460357666016e-06, -3.6954879760742188e-06, -2.950429916381836e-06, -2.205371856689453e-06, -1.4603137969970703e-06, -7.152557373046875e-07, 2.9802322387695312e-08, 7.748603820800781e-07, 1.519918441772461e-06, 2.2649765014648438e-06, 3.0100345611572266e-06, 3.7550926208496094e-06, 4.500150680541992e-06, 5.245208740234375e-06, 5.990266799926758e-06, 6.735324859619141e-06, 7.4803829193115234e-06, 8.225440979003906e-06, 8.970499038696289e-06, 9.715557098388672e-06, 1.0460615158081055e-05, 1.1205673217773438e-05, 1.195073127746582e-05, 1.2695789337158203e-05, 1.3440847396850586e-05, 1.4185905456542969e-05, 1.4930963516235352e-05, 1.5676021575927734e-05, 1.6421079635620117e-05, 1.71661376953125e-05, 1.7911195755004883e-05, 1.8656253814697266e-05, 1.940131187438965e-05, 2.014636993408203e-05, 2.0891427993774414e-05, 2.1636486053466797e-05, 2.238154411315918e-05, 2.3126602172851562e-05, 2.3871660232543945e-05, 2.4616718292236328e-05, 2.536177635192871e-05, 2.6106834411621094e-05, 2.6851892471313477e-05, 2.759695053100586e-05]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 4.0, 5.0, 3.0, 7.0, 6.0, 12.0, 14.0, 17.0, 16.0, 16.0, 35.0, 66.0, 114.0, 477.0, 4234.0, 259389.0, 777929.0, 5289.0, 532.0, 117.0, 67.0, 33.0, 33.0, 25.0, 16.0, 19.0, 10.0, 4.0, 13.0, 8.0, 7.0, 2.0, 7.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1385498046875, -0.13435745239257812, -0.13016510009765625, -0.12597274780273438, -0.1217803955078125, -0.11758804321289062, -0.11339569091796875, -0.10920333862304688, -0.105010986328125, -0.10081863403320312, -0.09662628173828125, -0.09243392944335938, -0.0882415771484375, -0.08404922485351562, -0.07985687255859375, -0.07566452026367188, -0.07147216796875, -0.06727981567382812, -0.06308746337890625, -0.058895111083984375, -0.0547027587890625, -0.050510406494140625, -0.04631805419921875, -0.042125701904296875, -0.037933349609375, -0.033740997314453125, -0.02954864501953125, -0.025356292724609375, -0.0211639404296875, -0.016971588134765625, -0.01277923583984375, -0.008586883544921875, -0.00439453125, -0.000202178955078125, 0.00399017333984375, 0.008182525634765625, 0.0123748779296875, 0.016567230224609375, 0.02075958251953125, 0.024951934814453125, 0.029144287109375, 0.033336639404296875, 0.03752899169921875, 0.041721343994140625, 0.0459136962890625, 0.050106048583984375, 0.05429840087890625, 0.058490753173828125, 0.06268310546875, 0.06687545776367188, 0.07106781005859375, 0.07526016235351562, 0.0794525146484375, 0.08364486694335938, 0.08783721923828125, 0.09202957153320312, 0.096221923828125, 0.10041427612304688, 0.10460662841796875, 0.10879898071289062, 0.1129913330078125, 0.11718368530273438, 0.12137603759765625, 0.12556838989257812, 0.1297607421875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 11.0, 16.0, 35.0, 38.0, 74.0, 187.0, 264.0, 190.0, 67.0, 36.0, 13.0, 14.0, 10.0, 6.0, 5.0, 6.0, 5.0, 2.0, 4.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0125885009765625, -0.012222528457641602, -0.011856555938720703, -0.011490583419799805, -0.011124610900878906, -0.010758638381958008, -0.01039266586303711, -0.010026693344116211, -0.009660720825195312, -0.009294748306274414, -0.008928775787353516, -0.008562803268432617, -0.008196830749511719, -0.00783085823059082, -0.007464885711669922, -0.0070989131927490234, -0.006732940673828125, -0.0063669681549072266, -0.006000995635986328, -0.00563502311706543, -0.005269050598144531, -0.004903078079223633, -0.004537105560302734, -0.004171133041381836, -0.0038051605224609375, -0.003439188003540039, -0.0030732154846191406, -0.002707242965698242, -0.0023412704467773438, -0.0019752979278564453, -0.0016093254089355469, -0.0012433528900146484, -0.00087738037109375, -0.0005114078521728516, -0.00014543533325195312, 0.0002205371856689453, 0.0005865097045898438, 0.0009524822235107422, 0.0013184547424316406, 0.001684427261352539, 0.0020503997802734375, 0.002416372299194336, 0.0027823448181152344, 0.003148317337036133, 0.0035142898559570312, 0.0038802623748779297, 0.004246234893798828, 0.0046122074127197266, 0.004978179931640625, 0.0053441524505615234, 0.005710124969482422, 0.00607609748840332, 0.006442070007324219, 0.006808042526245117, 0.007174015045166016, 0.007539987564086914, 0.007905960083007812, 0.008271932601928711, 0.00863790512084961, 0.009003877639770508, 0.009369850158691406, 0.009735822677612305, 0.010101795196533203, 0.010467767715454102, 0.010833740234375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 6.0, 12.0, 32.0, 202.0, 482.0, 208.0, 44.0, 9.0, 7.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.336677551269531, -14.041184425354004, -13.745691299438477, -13.45019817352295, -13.154705047607422, -12.859211921691895, -12.563718795776367, -12.26822566986084, -11.972732543945312, -11.677239418029785, -11.381746292114258, -11.08625316619873, -10.790760040283203, -10.495266914367676, -10.199773788452148, -9.904280662536621, -9.608787536621094, -9.313294410705566, -9.017801284790039, -8.722308158874512, -8.426815032958984, -8.131321907043457, -7.83582878112793, -7.540335655212402, -7.244842529296875, -6.949349403381348, -6.65385627746582, -6.358363151550293, -6.062870025634766, -5.767376899719238, -5.471883773803711, -5.176390647888184, -4.8808979988098145, -4.585404872894287, -4.28991174697876, -3.9944186210632324, -3.698925495147705, -3.4034323692321777, -3.1079392433166504, -2.812446117401123, -2.5169529914855957, -2.2214598655700684, -1.925966739654541, -1.6304736137390137, -1.3349804878234863, -1.039487361907959, -0.7439942359924316, -0.4485011100769043, -0.15300798416137695, 0.1424851417541504, 0.43797826766967773, 0.7334713935852051, 1.0289645195007324, 1.3244576454162598, 1.619950771331787, 1.9154438972473145, 2.210937023162842, 2.506430149078369, 2.8019232749938965, 3.097416400909424, 3.392909526824951, 3.6884026527404785, 3.983895778656006, 4.279388904571533, 4.5748820304870605]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 4.0, 7.0, 1.0, 10.0, 6.0, 10.0, 18.0, 22.0, 15.0, 20.0, 22.0, 35.0, 36.0, 30.0, 35.0, 39.0, 44.0, 35.0, 52.0, 46.0, 47.0, 56.0, 46.0, 40.0, 34.0, 30.0, 39.0, 38.0, 26.0, 26.0, 23.0, 30.0, 15.0, 8.0, 16.0, 8.0, 10.0, 6.0, 3.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.3640011548995972, -1.3239569664001465, -1.2839126586914062, -1.2438684701919556, -1.2038242816925049, -1.1637799739837646, -1.123735785484314, -1.0836915969848633, -1.043647289276123, -1.0036031007766724, -0.9635588526725769, -0.9235146045684814, -0.8834704160690308, -0.8434261679649353, -0.8033819198608398, -0.7633377313613892, -0.7232935428619385, -0.683249294757843, -0.6432051062583923, -0.6031608581542969, -0.5631166696548462, -0.5230724215507507, -0.4830281734466553, -0.4429839551448822, -0.40293973684310913, -0.36289551854133606, -0.322851300239563, -0.28280705213546753, -0.24276283383369446, -0.2027186155319214, -0.16267438232898712, -0.12263014912605286, -0.08258581161499023, -0.042541585862636566, -0.002497360110282898, 0.03754686564207077, 0.07759109139442444, 0.11763530969619751, 0.15767954289913177, 0.19772377610206604, 0.2377679944038391, 0.2778122127056122, 0.31785643100738525, 0.3579006791114807, 0.3979448974132538, 0.43798911571502686, 0.4780333638191223, 0.5180776119232178, 0.5581218004226685, 0.5981660485267639, 0.6382102370262146, 0.6782544851303101, 0.7182986736297607, 0.7583429217338562, 0.7983871698379517, 0.8384313583374023, 0.8784756064414978, 0.9185198545455933, 0.958564043045044, 0.9986082911491394, 1.0386525392532349, 1.0786967277526855, 1.1187409162521362, 1.1587852239608765, 1.1988294124603271]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 11.0, 12.0, 15.0, 23.0, 27.0, 44.0, 53.0, 103.0, 137.0, 225.0, 351.0, 628.0, 1101.0, 2130.0, 4295.0, 9160.0, 22758.0, 69604.0, 526633.0, 324739.0, 52382.0, 18255.0, 7986.0, 3654.0, 1921.0, 959.0, 513.0, 301.0, 185.0, 122.0, 57.0, 46.0, 30.0, 23.0, 18.0, 16.0, 5.0, 5.0, 4.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0, 2.0], "bins": [-1.4921875, -1.4517364501953125, -1.411285400390625, -1.3708343505859375, -1.33038330078125, -1.2899322509765625, -1.249481201171875, -1.2090301513671875, -1.1685791015625, -1.1281280517578125, -1.087677001953125, -1.0472259521484375, -1.00677490234375, -0.9663238525390625, -0.925872802734375, -0.8854217529296875, -0.844970703125, -0.8045196533203125, -0.764068603515625, -0.7236175537109375, -0.68316650390625, -0.6427154541015625, -0.602264404296875, -0.5618133544921875, -0.5213623046875, -0.4809112548828125, -0.440460205078125, -0.4000091552734375, -0.35955810546875, -0.3191070556640625, -0.278656005859375, -0.2382049560546875, -0.19775390625, -0.1573028564453125, -0.116851806640625, -0.0764007568359375, -0.03594970703125, 0.0045013427734375, 0.044952392578125, 0.0854034423828125, 0.1258544921875, 0.1663055419921875, 0.206756591796875, 0.2472076416015625, 0.28765869140625, 0.3281097412109375, 0.368560791015625, 0.4090118408203125, 0.449462890625, 0.4899139404296875, 0.530364990234375, 0.5708160400390625, 0.61126708984375, 0.6517181396484375, 0.692169189453125, 0.7326202392578125, 0.7730712890625, 0.8135223388671875, 0.853973388671875, 0.8944244384765625, 0.93487548828125, 0.9753265380859375, 1.015777587890625, 1.0562286376953125, 1.0966796875]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 5.0, 3.0, 7.0, 6.0, 10.0, 7.0, 14.0, 17.0, 18.0, 23.0, 27.0, 36.0, 47.0, 34.0, 35.0, 45.0, 37.0, 41.0, 53.0, 57.0, 53.0, 45.0, 45.0, 46.0, 33.0, 31.0, 28.0, 29.0, 22.0, 24.0, 24.0, 21.0, 15.0, 14.0, 7.0, 11.0, 8.0, 6.0, 6.0, 4.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.81640625, -3.7147216796875, -3.613037109375, -3.5113525390625, -3.40966796875, -3.3079833984375, -3.206298828125, -3.1046142578125, -3.0029296875, -2.9012451171875, -2.799560546875, -2.6978759765625, -2.59619140625, -2.4945068359375, -2.392822265625, -2.2911376953125, -2.189453125, -2.0877685546875, -1.986083984375, -1.8843994140625, -1.78271484375, -1.6810302734375, -1.579345703125, -1.4776611328125, -1.3759765625, -1.2742919921875, -1.172607421875, -1.0709228515625, -0.96923828125, -0.8675537109375, -0.765869140625, -0.6641845703125, -0.5625, -0.4608154296875, -0.359130859375, -0.2574462890625, -0.15576171875, -0.0540771484375, 0.047607421875, 0.1492919921875, 0.2509765625, 0.3526611328125, 0.454345703125, 0.5560302734375, 0.65771484375, 0.7593994140625, 0.861083984375, 0.9627685546875, 1.064453125, 1.1661376953125, 1.267822265625, 1.3695068359375, 1.47119140625, 1.5728759765625, 1.674560546875, 1.7762451171875, 1.8779296875, 1.9796142578125, 2.081298828125, 2.1829833984375, 2.28466796875, 2.3863525390625, 2.488037109375, 2.5897216796875, 2.69140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 5.0, 10.0, 8.0, 16.0, 15.0, 28.0, 29.0, 35.0, 63.0, 62.0, 113.0, 337.0, 1044557.0, 2842.0, 130.0, 63.0, 57.0, 47.0, 34.0, 19.0, 27.0, 13.0, 8.0, 9.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.21875, -21.539306640625, -20.85986328125, -20.180419921875, -19.5009765625, -18.821533203125, -18.14208984375, -17.462646484375, -16.783203125, -16.103759765625, -15.42431640625, -14.744873046875, -14.0654296875, -13.385986328125, -12.70654296875, -12.027099609375, -11.34765625, -10.668212890625, -9.98876953125, -9.309326171875, -8.6298828125, -7.950439453125, -7.27099609375, -6.591552734375, -5.912109375, -5.232666015625, -4.55322265625, -3.873779296875, -3.1943359375, -2.514892578125, -1.83544921875, -1.156005859375, -0.4765625, 0.202880859375, 0.88232421875, 1.561767578125, 2.2412109375, 2.920654296875, 3.60009765625, 4.279541015625, 4.958984375, 5.638427734375, 6.31787109375, 6.997314453125, 7.6767578125, 8.356201171875, 9.03564453125, 9.715087890625, 10.39453125, 11.073974609375, 11.75341796875, 12.432861328125, 13.1123046875, 13.791748046875, 14.47119140625, 15.150634765625, 15.830078125, 16.509521484375, 17.18896484375, 17.868408203125, 18.5478515625, 19.227294921875, 19.90673828125, 20.586181640625, 21.265625]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 8.0, 7.0, 10.0, 17.0, 14.0, 25.0, 31.0, 36.0, 63.0, 61.0, 73.0, 80.0, 105.0, 82.0, 86.0, 63.0, 53.0, 47.0, 36.0, 18.0, 30.0, 13.0, 8.0, 9.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.76171875, -7.5244140625, -7.287109375, -7.0498046875, -6.8125, -6.5751953125, -6.337890625, -6.1005859375, -5.86328125, -5.6259765625, -5.388671875, -5.1513671875, -4.9140625, -4.6767578125, -4.439453125, -4.2021484375, -3.96484375, -3.7275390625, -3.490234375, -3.2529296875, -3.015625, -2.7783203125, -2.541015625, -2.3037109375, -2.06640625, -1.8291015625, -1.591796875, -1.3544921875, -1.1171875, -0.8798828125, -0.642578125, -0.4052734375, -0.16796875, 0.0693359375, 0.306640625, 0.5439453125, 0.78125, 1.0185546875, 1.255859375, 1.4931640625, 1.73046875, 1.9677734375, 2.205078125, 2.4423828125, 2.6796875, 2.9169921875, 3.154296875, 3.3916015625, 3.62890625, 3.8662109375, 4.103515625, 4.3408203125, 4.578125, 4.8154296875, 5.052734375, 5.2900390625, 5.52734375, 5.7646484375, 6.001953125, 6.2392578125, 6.4765625, 6.7138671875, 6.951171875, 7.1884765625, 7.42578125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 1.0, 6.0, 10.0, 15.0, 32.0, 61.0, 67.0, 156.0, 348.0, 958.0, 3239.0, 17044.0, 772024.0, 236224.0, 14087.0, 2763.0, 871.0, 305.0, 127.0, 76.0, 50.0, 29.0, 13.0, 8.0, 6.0, 8.0, 8.0, 0.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.673828125, -0.64971923828125, -0.6256103515625, -0.60150146484375, -0.577392578125, -0.55328369140625, -0.5291748046875, -0.50506591796875, -0.48095703125, -0.45684814453125, -0.4327392578125, -0.40863037109375, -0.384521484375, -0.36041259765625, -0.3363037109375, -0.31219482421875, -0.2880859375, -0.26397705078125, -0.2398681640625, -0.21575927734375, -0.191650390625, -0.16754150390625, -0.1434326171875, -0.11932373046875, -0.09521484375, -0.07110595703125, -0.0469970703125, -0.02288818359375, 0.001220703125, 0.02532958984375, 0.0494384765625, 0.07354736328125, 0.09765625, 0.12176513671875, 0.1458740234375, 0.16998291015625, 0.194091796875, 0.21820068359375, 0.2423095703125, 0.26641845703125, 0.29052734375, 0.31463623046875, 0.3387451171875, 0.36285400390625, 0.386962890625, 0.41107177734375, 0.4351806640625, 0.45928955078125, 0.4833984375, 0.50750732421875, 0.5316162109375, 0.55572509765625, 0.579833984375, 0.60394287109375, 0.6280517578125, 0.65216064453125, 0.67626953125, 0.70037841796875, 0.7244873046875, 0.74859619140625, 0.772705078125, 0.79681396484375, 0.8209228515625, 0.84503173828125, 0.869140625]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 8.0, 3.0, 10.0, 9.0, 23.0, 37.0, 55.0, 126.0, 298.0, 187.0, 94.0, 43.0, 29.0, 16.0, 12.0, 10.0, 8.0, 6.0, 7.0, 4.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.888410568237305e-05, -9.626150131225586e-05, -9.363889694213867e-05, -9.101629257202148e-05, -8.83936882019043e-05, -8.577108383178711e-05, -8.314847946166992e-05, -8.052587509155273e-05, -7.790327072143555e-05, -7.528066635131836e-05, -7.265806198120117e-05, -7.003545761108398e-05, -6.74128532409668e-05, -6.479024887084961e-05, -6.216764450073242e-05, -5.9545040130615234e-05, -5.692243576049805e-05, -5.429983139038086e-05, -5.167722702026367e-05, -4.9054622650146484e-05, -4.64320182800293e-05, -4.380941390991211e-05, -4.118680953979492e-05, -3.8564205169677734e-05, -3.594160079956055e-05, -3.331899642944336e-05, -3.069639205932617e-05, -2.8073787689208984e-05, -2.5451183319091797e-05, -2.282857894897461e-05, -2.0205974578857422e-05, -1.7583370208740234e-05, -1.4960765838623047e-05, -1.233816146850586e-05, -9.715557098388672e-06, -7.092952728271484e-06, -4.470348358154297e-06, -1.8477439880371094e-06, 7.748603820800781e-07, 3.3974647521972656e-06, 6.020069122314453e-06, 8.64267349243164e-06, 1.1265277862548828e-05, 1.3887882232666016e-05, 1.6510486602783203e-05, 1.913309097290039e-05, 2.1755695343017578e-05, 2.4378299713134766e-05, 2.7000904083251953e-05, 2.962350845336914e-05, 3.224611282348633e-05, 3.4868717193603516e-05, 3.74913215637207e-05, 4.011392593383789e-05, 4.273653030395508e-05, 4.5359134674072266e-05, 4.798173904418945e-05, 5.060434341430664e-05, 5.322694778442383e-05, 5.5849552154541016e-05, 5.84721565246582e-05, 6.109476089477539e-05, 6.371736526489258e-05, 6.633996963500977e-05, 6.896257400512695e-05]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 1.0, 4.0, 8.0, 9.0, 12.0, 24.0, 31.0, 60.0, 76.0, 114.0, 242.0, 436.0, 954.0, 2488.0, 7975.0, 42338.0, 901018.0, 75977.0, 11312.0, 3141.0, 1140.0, 559.0, 256.0, 151.0, 87.0, 55.0, 31.0, 12.0, 14.0, 6.0, 8.0, 2.0, 7.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6416015625, -0.6225204467773438, -0.6034393310546875, -0.5843582153320312, -0.565277099609375, -0.5461959838867188, -0.5271148681640625, -0.5080337524414062, -0.48895263671875, -0.46987152099609375, -0.4507904052734375, -0.43170928955078125, -0.412628173828125, -0.39354705810546875, -0.3744659423828125, -0.35538482666015625, -0.3363037109375, -0.31722259521484375, -0.2981414794921875, -0.27906036376953125, -0.259979248046875, -0.24089813232421875, -0.2218170166015625, -0.20273590087890625, -0.18365478515625, -0.16457366943359375, -0.1454925537109375, -0.12641143798828125, -0.107330322265625, -0.08824920654296875, -0.0691680908203125, -0.05008697509765625, -0.031005859375, -0.01192474365234375, 0.0071563720703125, 0.02623748779296875, 0.045318603515625, 0.06439971923828125, 0.0834808349609375, 0.10256195068359375, 0.12164306640625, 0.14072418212890625, 0.1598052978515625, 0.17888641357421875, 0.197967529296875, 0.21704864501953125, 0.2361297607421875, 0.25521087646484375, 0.2742919921875, 0.29337310791015625, 0.3124542236328125, 0.33153533935546875, 0.350616455078125, 0.36969757080078125, 0.3887786865234375, 0.40785980224609375, 0.42694091796875, 0.44602203369140625, 0.4651031494140625, 0.48418426513671875, 0.503265380859375, 0.5223464965820312, 0.5414276123046875, 0.5605087280273438, 0.57958984375]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 0.0, 2.0, 8.0, 7.0, 13.0, 16.0, 18.0, 30.0, 40.0, 82.0, 141.0, 351.0, 117.0, 67.0, 35.0, 19.0, 11.0, 13.0, 10.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2205810546875, -0.21435165405273438, -0.20812225341796875, -0.20189285278320312, -0.1956634521484375, -0.18943405151367188, -0.18320465087890625, -0.17697525024414062, -0.170745849609375, -0.16451644897460938, -0.15828704833984375, -0.15205764770507812, -0.1458282470703125, -0.13959884643554688, -0.13336944580078125, -0.12714004516601562, -0.12091064453125, -0.11468124389648438, -0.10845184326171875, -0.10222244262695312, -0.0959930419921875, -0.08976364135742188, -0.08353424072265625, -0.07730484008789062, -0.071075439453125, -0.06484603881835938, -0.05861663818359375, -0.052387237548828125, -0.0461578369140625, -0.039928436279296875, -0.03369903564453125, -0.027469635009765625, -0.021240234375, -0.015010833740234375, -0.00878143310546875, -0.002552032470703125, 0.0036773681640625, 0.009906768798828125, 0.01613616943359375, 0.022365570068359375, 0.028594970703125, 0.034824371337890625, 0.04105377197265625, 0.047283172607421875, 0.0535125732421875, 0.059741973876953125, 0.06597137451171875, 0.07220077514648438, 0.07843017578125, 0.08465957641601562, 0.09088897705078125, 0.09711837768554688, 0.1033477783203125, 0.10957717895507812, 0.11580657958984375, 0.12203598022460938, 0.128265380859375, 0.13449478149414062, 0.14072418212890625, 0.14695358276367188, 0.1531829833984375, 0.15941238403320312, 0.16564178466796875, 0.17187118530273438, 0.1781005859375]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 6.0, 7.0, 13.0, 15.0, 34.0, 115.0, 243.0, 285.0, 163.0, 61.0, 36.0, 11.0, 8.0, 5.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.668109893798828, -12.3677339553833, -12.06735897064209, -11.766983032226562, -11.466608047485352, -11.166232109069824, -10.865856170654297, -10.565481185913086, -10.265105247497559, -9.964729309082031, -9.66435432434082, -9.363978385925293, -9.063603401184082, -8.763227462768555, -8.462852478027344, -8.162476539611816, -7.862101078033447, -7.561725616455078, -7.261350154876709, -6.96097469329834, -6.6605987548828125, -6.360223293304443, -6.059847831726074, -5.759471893310547, -5.459096908569336, -5.158721446990967, -4.858345985412598, -4.55797004699707, -4.257594585418701, -3.957219123840332, -3.656843662261963, -3.3564679622650146, -3.0560927391052246, -2.7557172775268555, -2.4553415775299072, -2.154966115951538, -1.8545905351638794, -1.5542149543762207, -1.2538394927978516, -0.9534637928009033, -0.6530883312225342, -0.3527127802371979, -0.05233722925186157, 0.24803829193115234, 0.548413872718811, 0.8487894535064697, 1.1491649150848389, 1.449540615081787, 1.7499160766601562, 2.0502915382385254, 2.3506672382354736, 2.6510426998138428, 2.951418399810791, 3.25179386138916, 3.5521693229675293, 3.8525450229644775, 4.152920722961426, 4.453296184539795, 4.753671646118164, 5.054047584533691, 5.3544230461120605, 5.65479850769043, 5.955173969268799, 6.255549430847168, 6.555924892425537]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 6.0, 5.0, 8.0, 17.0, 10.0, 12.0, 22.0, 13.0, 27.0, 24.0, 34.0, 34.0, 32.0, 46.0, 53.0, 60.0, 47.0, 35.0, 45.0, 38.0, 56.0, 49.0, 38.0, 46.0, 45.0, 33.0, 26.0, 27.0, 21.0, 22.0, 23.0, 7.0, 11.0, 7.0, 4.0, 7.0, 4.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.450930118560791, -7.241085529327393, -7.031241416931152, -6.821396827697754, -6.6115522384643555, -6.401707649230957, -6.191863536834717, -5.982018947601318, -5.772174835205078, -5.56233024597168, -5.3524861335754395, -5.142641544342041, -4.932796955108643, -4.722952842712402, -4.513108253479004, -4.3032636642456055, -4.093419075012207, -3.8835747241973877, -3.6737301349639893, -3.46388578414917, -3.2540411949157715, -3.044196844100952, -2.834352493286133, -2.6245079040527344, -2.414663553237915, -2.2048192024230957, -1.9949746131896973, -1.785130262374878, -1.575285792350769, -1.3654413223266602, -1.1555969715118408, -0.9457525014877319, -0.735908031463623, -0.5260635614395142, -0.31621915102005005, -0.10637474060058594, 0.10346972942352295, 0.31331419944763184, 0.5231585502624512, 0.7330030202865601, 0.942847490310669, 1.1526919603347778, 1.3625364303588867, 1.572380781173706, 1.782225251197815, 1.9920697212219238, 2.201914072036743, 2.4117584228515625, 2.621603012084961, 2.8314473628997803, 3.0412919521331787, 3.251136302947998, 3.4609808921813965, 3.670825242996216, 3.880669593811035, 4.090514183044434, 4.300358772277832, 4.5102033615112305, 4.720047473907471, 4.929892063140869, 5.139736652374268, 5.349580764770508, 5.559425354003906, 5.769269943237305, 5.979114055633545]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 5.0, 7.0, 7.0, 14.0, 6.0, 15.0, 20.0, 25.0, 29.0, 37.0, 73.0, 78.0, 148.0, 322.0, 777.0, 2909.0, 15151.0, 218424.0, 3837478.0, 105163.0, 10207.0, 2088.0, 630.0, 247.0, 139.0, 71.0, 61.0, 31.0, 26.0, 14.0, 11.0, 16.0, 14.0, 10.0, 6.0, 7.0, 3.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.09735107421875, -4.9447021484375, -4.79205322265625, -4.639404296875, -4.48675537109375, -4.3341064453125, -4.18145751953125, -4.02880859375, -3.87615966796875, -3.7235107421875, -3.57086181640625, -3.418212890625, -3.26556396484375, -3.1129150390625, -2.96026611328125, -2.8076171875, -2.65496826171875, -2.5023193359375, -2.34967041015625, -2.197021484375, -2.04437255859375, -1.8917236328125, -1.73907470703125, -1.58642578125, -1.43377685546875, -1.2811279296875, -1.12847900390625, -0.975830078125, -0.82318115234375, -0.6705322265625, -0.51788330078125, -0.365234375, -0.21258544921875, -0.0599365234375, 0.09271240234375, 0.245361328125, 0.39801025390625, 0.5506591796875, 0.70330810546875, 0.85595703125, 1.00860595703125, 1.1612548828125, 1.31390380859375, 1.466552734375, 1.61920166015625, 1.7718505859375, 1.92449951171875, 2.0771484375, 2.22979736328125, 2.3824462890625, 2.53509521484375, 2.687744140625, 2.84039306640625, 2.9930419921875, 3.14569091796875, 3.29833984375, 3.45098876953125, 3.6036376953125, 3.75628662109375, 3.908935546875, 4.06158447265625, 4.2142333984375, 4.36688232421875, 4.51953125]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 6.0, 10.0, 11.0, 5.0, 9.0, 18.0, 17.0, 25.0, 28.0, 35.0, 40.0, 47.0, 56.0, 51.0, 50.0, 68.0, 58.0, 59.0, 48.0, 52.0, 49.0, 38.0, 37.0, 26.0, 20.0, 33.0, 23.0, 19.0, 10.0, 8.0, 9.0, 10.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.796875, -1.7444610595703125, -1.692047119140625, -1.6396331787109375, -1.58721923828125, -1.5348052978515625, -1.482391357421875, -1.4299774169921875, -1.3775634765625, -1.3251495361328125, -1.272735595703125, -1.2203216552734375, -1.16790771484375, -1.1154937744140625, -1.063079833984375, -1.0106658935546875, -0.958251953125, -0.9058380126953125, -0.853424072265625, -0.8010101318359375, -0.74859619140625, -0.6961822509765625, -0.643768310546875, -0.5913543701171875, -0.5389404296875, -0.4865264892578125, -0.434112548828125, -0.3816986083984375, -0.32928466796875, -0.2768707275390625, -0.224456787109375, -0.1720428466796875, -0.11962890625, -0.0672149658203125, -0.014801025390625, 0.0376129150390625, 0.09002685546875, 0.1424407958984375, 0.194854736328125, 0.2472686767578125, 0.2996826171875, 0.3520965576171875, 0.404510498046875, 0.4569244384765625, 0.50933837890625, 0.5617523193359375, 0.614166259765625, 0.6665802001953125, 0.718994140625, 0.7714080810546875, 0.823822021484375, 0.8762359619140625, 0.92864990234375, 0.9810638427734375, 1.033477783203125, 1.0858917236328125, 1.1383056640625, 1.1907196044921875, 1.243133544921875, 1.2955474853515625, 1.34796142578125, 1.4003753662109375, 1.452789306640625, 1.5052032470703125, 1.5576171875]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 5.0, 5.0, 4.0, 12.0, 30.0, 158.0, 4463.0, 4187854.0, 1613.0, 108.0, 26.0, 9.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.125, -33.3565673828125, -32.588134765625, -31.8197021484375, -31.05126953125, -30.2828369140625, -29.514404296875, -28.7459716796875, -27.9775390625, -27.2091064453125, -26.440673828125, -25.6722412109375, -24.90380859375, -24.1353759765625, -23.366943359375, -22.5985107421875, -21.830078125, -21.0616455078125, -20.293212890625, -19.5247802734375, -18.75634765625, -17.9879150390625, -17.219482421875, -16.4510498046875, -15.6826171875, -14.9141845703125, -14.145751953125, -13.3773193359375, -12.60888671875, -11.8404541015625, -11.072021484375, -10.3035888671875, -9.53515625, -8.7667236328125, -7.998291015625, -7.2298583984375, -6.46142578125, -5.6929931640625, -4.924560546875, -4.1561279296875, -3.3876953125, -2.6192626953125, -1.850830078125, -1.0823974609375, -0.31396484375, 0.4544677734375, 1.222900390625, 1.9913330078125, 2.759765625, 3.5281982421875, 4.296630859375, 5.0650634765625, 5.83349609375, 6.6019287109375, 7.370361328125, 8.1387939453125, 8.9072265625, 9.6756591796875, 10.444091796875, 11.2125244140625, 11.98095703125, 12.7493896484375, 13.517822265625, 14.2862548828125, 15.0546875]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 7.0, 15.0, 17.0, 28.0, 34.0, 71.0, 99.0, 143.0, 288.0, 687.0, 1466.0, 506.0, 245.0, 177.0, 110.0, 69.0, 39.0, 28.0, 12.0, 7.0, 7.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.560546875, -0.534332275390625, -0.50811767578125, -0.481903076171875, -0.4556884765625, -0.429473876953125, -0.40325927734375, -0.377044677734375, -0.350830078125, -0.324615478515625, -0.29840087890625, -0.272186279296875, -0.2459716796875, -0.219757080078125, -0.19354248046875, -0.167327880859375, -0.14111328125, -0.114898681640625, -0.08868408203125, -0.062469482421875, -0.0362548828125, -0.010040283203125, 0.01617431640625, 0.042388916015625, 0.068603515625, 0.094818115234375, 0.12103271484375, 0.147247314453125, 0.1734619140625, 0.199676513671875, 0.22589111328125, 0.252105712890625, 0.2783203125, 0.304534912109375, 0.33074951171875, 0.356964111328125, 0.3831787109375, 0.409393310546875, 0.43560791015625, 0.461822509765625, 0.488037109375, 0.514251708984375, 0.54046630859375, 0.566680908203125, 0.5928955078125, 0.619110107421875, 0.64532470703125, 0.671539306640625, 0.69775390625, 0.723968505859375, 0.75018310546875, 0.776397705078125, 0.8026123046875, 0.828826904296875, 0.85504150390625, 0.881256103515625, 0.907470703125, 0.933685302734375, 0.95989990234375, 0.986114501953125, 1.0123291015625, 1.038543701171875, 1.06475830078125, 1.090972900390625, 1.1171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 1.0, 7.0, 13.0, 8.0, 14.0, 28.0, 29.0, 71.0, 120.0, 156.0, 214.0, 130.0, 80.0, 48.0, 24.0, 16.0, 11.0, 12.0, 5.0, 2.0, 6.0, 0.0, 1.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.755366802215576, -4.611855983734131, -4.4683451652526855, -4.32483434677124, -4.181323528289795, -4.03781270980835, -3.8943018913269043, -3.750791072845459, -3.6072802543640137, -3.4637694358825684, -3.320258617401123, -3.1767477989196777, -3.0332369804382324, -2.889726161956787, -2.746215343475342, -2.6027045249938965, -2.4591939449310303, -2.315683126449585, -2.1721723079681396, -2.0286614894866943, -1.885150671005249, -1.7416398525238037, -1.598129153251648, -1.4546183347702026, -1.3111075162887573, -1.167596697807312, -1.0240858793258667, -0.8805751204490662, -0.7370643019676208, -0.5935534834861755, -0.450042724609375, -0.3065319061279297, -0.16302108764648438, -0.019510284066200256, 0.12400051951408386, 0.2675113081932068, 0.4110221266746521, 0.5545329451560974, 0.698043704032898, 0.8415545225143433, 0.9850653409957886, 1.1285761594772339, 1.2720869779586792, 1.415597677230835, 1.5591084957122803, 1.7026193141937256, 1.846130132675171, 1.9896409511566162, 2.1331517696380615, 2.276662588119507, 2.420173406600952, 2.5636842250823975, 2.7071950435638428, 2.850705862045288, 2.9942164421081543, 3.1377272605895996, 3.281238079071045, 3.4247488975524902, 3.5682597160339355, 3.711770534515381, 3.855281352996826, 3.9987921714782715, 4.142302989959717, 4.285813808441162, 4.429324626922607]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 3.0, 6.0, 7.0, 8.0, 3.0, 4.0, 9.0, 14.0, 18.0, 15.0, 19.0, 29.0, 40.0, 41.0, 52.0, 50.0, 52.0, 42.0, 54.0, 46.0, 55.0, 40.0, 58.0, 40.0, 32.0, 47.0, 38.0, 26.0, 22.0, 20.0, 22.0, 13.0, 12.0, 17.0, 17.0, 5.0, 11.0, 4.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8465375900268555, -1.7900300025939941, -1.7335222959518433, -1.6770145893096924, -1.620507001876831, -1.5639994144439697, -1.5074917078018188, -1.450984001159668, -1.3944764137268066, -1.3379688262939453, -1.2814611196517944, -1.2249534130096436, -1.1684458255767822, -1.111938238143921, -1.05543053150177, -0.9989228844642639, -0.9424152374267578, -0.8859075903892517, -0.8293999433517456, -0.7728922963142395, -0.7163846492767334, -0.6598770022392273, -0.6033693552017212, -0.5468617081642151, -0.490354061126709, -0.4338464140892029, -0.3773387670516968, -0.3208311200141907, -0.26432347297668457, -0.20781582593917847, -0.15130817890167236, -0.09480053186416626, -0.03829300403594971, 0.018214643001556396, 0.0747222900390625, 0.1312299370765686, 0.1877375841140747, 0.2442452311515808, 0.3007528781890869, 0.357260525226593, 0.4137681722640991, 0.4702758193016052, 0.5267834663391113, 0.5832911133766174, 0.6397987604141235, 0.6963064074516296, 0.7528140544891357, 0.8093217015266418, 0.865829348564148, 0.922336995601654, 0.9788446426391602, 1.0353522300720215, 1.0918599367141724, 1.1483676433563232, 1.2048752307891846, 1.261382818222046, 1.3178905248641968, 1.3743982315063477, 1.430905818939209, 1.4874134063720703, 1.5439211130142212, 1.600428819656372, 1.6569364070892334, 1.7134439945220947, 1.7699517011642456]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 0.0, 8.0, 21.0, 21.0, 21.0, 22.0, 29.0, 63.0, 92.0, 148.0, 224.0, 458.0, 836.0, 1750.0, 4785.0, 26718.0, 815720.0, 181080.0, 10823.0, 2920.0, 1261.0, 632.0, 381.0, 192.0, 134.0, 75.0, 30.0, 29.0, 16.0, 18.0, 11.0, 4.0, 9.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.4609375, -0.4459648132324219, -0.43099212646484375, -0.4160194396972656, -0.4010467529296875, -0.3860740661621094, -0.37110137939453125, -0.3561286926269531, -0.341156005859375, -0.3261833190917969, -0.31121063232421875, -0.2962379455566406, -0.2812652587890625, -0.2662925720214844, -0.25131988525390625, -0.23634719848632812, -0.22137451171875, -0.20640182495117188, -0.19142913818359375, -0.17645645141601562, -0.1614837646484375, -0.14651107788085938, -0.13153839111328125, -0.11656570434570312, -0.101593017578125, -0.08662033081054688, -0.07164764404296875, -0.056674957275390625, -0.0417022705078125, -0.026729583740234375, -0.01175689697265625, 0.003215789794921875, 0.0181884765625, 0.033161163330078125, 0.04813385009765625, 0.06310653686523438, 0.0780792236328125, 0.09305191040039062, 0.10802459716796875, 0.12299728393554688, 0.137969970703125, 0.15294265747070312, 0.16791534423828125, 0.18288803100585938, 0.1978607177734375, 0.21283340454101562, 0.22780609130859375, 0.24277877807617188, 0.25775146484375, 0.2727241516113281, 0.28769683837890625, 0.3026695251464844, 0.3176422119140625, 0.3326148986816406, 0.34758758544921875, 0.3625602722167969, 0.377532958984375, 0.3925056457519531, 0.40747833251953125, 0.4224510192871094, 0.4374237060546875, 0.4523963928222656, 0.46736907958984375, 0.4823417663574219, 0.497314453125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 2.0, 4.0, 6.0, 4.0, 5.0, 12.0, 7.0, 7.0, 12.0, 14.0, 25.0, 37.0, 27.0, 41.0, 63.0, 60.0, 70.0, 51.0, 50.0, 72.0, 55.0, 47.0, 45.0, 43.0, 44.0, 33.0, 30.0, 27.0, 17.0, 13.0, 17.0, 17.0, 10.0, 15.0, 5.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3525390625, -1.311553955078125, -1.27056884765625, -1.229583740234375, -1.1885986328125, -1.147613525390625, -1.10662841796875, -1.065643310546875, -1.024658203125, -0.983673095703125, -0.94268798828125, -0.901702880859375, -0.8607177734375, -0.819732666015625, -0.77874755859375, -0.737762451171875, -0.69677734375, -0.655792236328125, -0.61480712890625, -0.573822021484375, -0.5328369140625, -0.491851806640625, -0.45086669921875, -0.409881591796875, -0.368896484375, -0.327911376953125, -0.28692626953125, -0.245941162109375, -0.2049560546875, -0.163970947265625, -0.12298583984375, -0.082000732421875, -0.041015625, -3.0517578125e-05, 0.04095458984375, 0.081939697265625, 0.1229248046875, 0.163909912109375, 0.20489501953125, 0.245880126953125, 0.286865234375, 0.327850341796875, 0.36883544921875, 0.409820556640625, 0.4508056640625, 0.491790771484375, 0.53277587890625, 0.573760986328125, 0.61474609375, 0.655731201171875, 0.69671630859375, 0.737701416015625, 0.7786865234375, 0.819671630859375, 0.86065673828125, 0.901641845703125, 0.942626953125, 0.983612060546875, 1.02459716796875, 1.065582275390625, 1.1065673828125, 1.147552490234375, 1.18853759765625, 1.229522705078125, 1.2705078125]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 1.0, 6.0, 5.0, 13.0, 12.0, 21.0, 18.0, 17.0, 33.0, 41.0, 55.0, 63.0, 122.0, 158.0, 282.0, 466.0, 1247.0, 5436.0, 53881.0, 738085.0, 229383.0, 14984.0, 2416.0, 746.0, 318.0, 206.0, 139.0, 113.0, 75.0, 54.0, 39.0, 30.0, 19.0, 25.0, 14.0, 6.0, 8.0, 3.0, 5.0, 7.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2059326171875, -0.1994457244873047, -0.19295883178710938, -0.18647193908691406, -0.17998504638671875, -0.17349815368652344, -0.16701126098632812, -0.1605243682861328, -0.1540374755859375, -0.1475505828857422, -0.14106369018554688, -0.13457679748535156, -0.12808990478515625, -0.12160301208496094, -0.11511611938476562, -0.10862922668457031, -0.102142333984375, -0.09565544128417969, -0.08916854858398438, -0.08268165588378906, -0.07619476318359375, -0.06970787048339844, -0.06322097778320312, -0.05673408508300781, -0.0502471923828125, -0.04376029968261719, -0.037273406982421875, -0.030786514282226562, -0.02429962158203125, -0.017812728881835938, -0.011325836181640625, -0.0048389434814453125, 0.00164794921875, 0.008134841918945312, 0.014621734619140625, 0.021108627319335938, 0.02759552001953125, 0.03408241271972656, 0.040569305419921875, 0.04705619812011719, 0.0535430908203125, 0.06002998352050781, 0.06651687622070312, 0.07300376892089844, 0.07949066162109375, 0.08597755432128906, 0.09246444702148438, 0.09895133972167969, 0.105438232421875, 0.11192512512207031, 0.11841201782226562, 0.12489891052246094, 0.13138580322265625, 0.13787269592285156, 0.14435958862304688, 0.1508464813232422, 0.1573333740234375, 0.1638202667236328, 0.17030715942382812, 0.17679405212402344, 0.18328094482421875, 0.18976783752441406, 0.19625473022460938, 0.2027416229248047, 0.209228515625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 9.0, 16.0, 11.0, 16.0, 19.0, 18.0, 20.0, 36.0, 21.0, 32.0, 24.0, 52.0, 43.0, 44.0, 59.0, 60.0, 41.0, 52.0, 38.0, 45.0, 54.0, 42.0, 32.0, 48.0, 22.0, 27.0, 24.0, 23.0, 14.0, 13.0, 11.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8505859375, -1.7871551513671875, -1.723724365234375, -1.6602935791015625, -1.59686279296875, -1.5334320068359375, -1.470001220703125, -1.4065704345703125, -1.3431396484375, -1.2797088623046875, -1.216278076171875, -1.1528472900390625, -1.08941650390625, -1.0259857177734375, -0.962554931640625, -0.8991241455078125, -0.835693359375, -0.7722625732421875, -0.708831787109375, -0.6454010009765625, -0.58197021484375, -0.5185394287109375, -0.455108642578125, -0.3916778564453125, -0.3282470703125, -0.2648162841796875, -0.201385498046875, -0.1379547119140625, -0.07452392578125, -0.0110931396484375, 0.052337646484375, 0.1157684326171875, 0.17919921875, 0.2426300048828125, 0.306060791015625, 0.3694915771484375, 0.43292236328125, 0.4963531494140625, 0.559783935546875, 0.6232147216796875, 0.6866455078125, 0.7500762939453125, 0.813507080078125, 0.8769378662109375, 0.94036865234375, 1.0037994384765625, 1.067230224609375, 1.1306610107421875, 1.194091796875, 1.2575225830078125, 1.320953369140625, 1.3843841552734375, 1.44781494140625, 1.5112457275390625, 1.574676513671875, 1.6381072998046875, 1.7015380859375, 1.7649688720703125, 1.828399658203125, 1.8918304443359375, 1.95526123046875, 2.0186920166015625, 2.082122802734375, 2.1455535888671875, 2.208984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 5.0, 6.0, 7.0, 10.0, 6.0, 14.0, 28.0, 57.0, 89.0, 201.0, 832.0, 14911.0, 1027949.0, 3640.0, 493.0, 130.0, 82.0, 29.0, 18.0, 15.0, 13.0, 5.0, 3.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.2421875, -0.2360248565673828, -0.22986221313476562, -0.22369956970214844, -0.21753692626953125, -0.21137428283691406, -0.20521163940429688, -0.1990489959716797, -0.1928863525390625, -0.1867237091064453, -0.18056106567382812, -0.17439842224121094, -0.16823577880859375, -0.16207313537597656, -0.15591049194335938, -0.1497478485107422, -0.143585205078125, -0.1374225616455078, -0.13125991821289062, -0.12509727478027344, -0.11893463134765625, -0.11277198791503906, -0.10660934448242188, -0.10044670104980469, -0.0942840576171875, -0.08812141418457031, -0.08195877075195312, -0.07579612731933594, -0.06963348388671875, -0.06347084045410156, -0.057308197021484375, -0.05114555358886719, -0.04498291015625, -0.03882026672363281, -0.032657623291015625, -0.026494979858398438, -0.02033233642578125, -0.014169692993164062, -0.008007049560546875, -0.0018444061279296875, 0.0043182373046875, 0.010480880737304688, 0.016643524169921875, 0.022806167602539062, 0.02896881103515625, 0.03513145446777344, 0.041294097900390625, 0.04745674133300781, 0.053619384765625, 0.05978202819824219, 0.06594467163085938, 0.07210731506347656, 0.07826995849609375, 0.08443260192871094, 0.09059524536132812, 0.09675788879394531, 0.1029205322265625, 0.10908317565917969, 0.11524581909179688, 0.12140846252441406, 0.12757110595703125, 0.13373374938964844, 0.13989639282226562, 0.1460590362548828, 0.1522216796875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 2.0, 8.0, 11.0, 10.0, 27.0, 37.0, 59.0, 91.0, 148.0, 151.0, 125.0, 119.0, 70.0, 42.0, 37.0, 30.0, 13.0, 5.0, 5.0, 6.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.913309097290039e-05, -1.825764775276184e-05, -1.738220453262329e-05, -1.650676131248474e-05, -1.563131809234619e-05, -1.4755874872207642e-05, -1.3880431652069092e-05, -1.3004988431930542e-05, -1.2129545211791992e-05, -1.1254101991653442e-05, -1.0378658771514893e-05, -9.503215551376343e-06, -8.627772331237793e-06, -7.752329111099243e-06, -6.876885890960693e-06, -6.0014426708221436e-06, -5.125999450683594e-06, -4.250556230545044e-06, -3.375113010406494e-06, -2.4996697902679443e-06, -1.6242265701293945e-06, -7.487833499908447e-07, 1.2665987014770508e-07, 1.0021030902862549e-06, 1.8775463104248047e-06, 2.7529895305633545e-06, 3.6284327507019043e-06, 4.503875970840454e-06, 5.379319190979004e-06, 6.254762411117554e-06, 7.1302056312561035e-06, 8.005648851394653e-06, 8.881092071533203e-06, 9.756535291671753e-06, 1.0631978511810303e-05, 1.1507421731948853e-05, 1.2382864952087402e-05, 1.3258308172225952e-05, 1.4133751392364502e-05, 1.5009194612503052e-05, 1.58846378326416e-05, 1.676008105278015e-05, 1.76355242729187e-05, 1.851096749305725e-05, 1.93864107131958e-05, 2.026185393333435e-05, 2.11372971534729e-05, 2.201274037361145e-05, 2.288818359375e-05, 2.376362681388855e-05, 2.46390700340271e-05, 2.551451325416565e-05, 2.63899564743042e-05, 2.726539969444275e-05, 2.81408429145813e-05, 2.901628613471985e-05, 2.98917293548584e-05, 3.076717257499695e-05, 3.16426157951355e-05, 3.251805901527405e-05, 3.33935022354126e-05, 3.426894545555115e-05, 3.51443886756897e-05, 3.601983189582825e-05, 3.68952751159668e-05]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 1.0, 8.0, 8.0, 11.0, 21.0, 22.0, 55.0, 88.0, 161.0, 282.0, 651.0, 1894.0, 7260.0, 99331.0, 918212.0, 15632.0, 2989.0, 997.0, 416.0, 201.0, 113.0, 57.0, 36.0, 33.0, 20.0, 12.0, 10.0, 9.0, 7.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10113525390625, -0.0976724624633789, -0.09420967102050781, -0.09074687957763672, -0.08728408813476562, -0.08382129669189453, -0.08035850524902344, -0.07689571380615234, -0.07343292236328125, -0.06997013092041016, -0.06650733947753906, -0.06304454803466797, -0.059581756591796875, -0.05611896514892578, -0.05265617370605469, -0.049193382263183594, -0.0457305908203125, -0.042267799377441406, -0.03880500793457031, -0.03534221649169922, -0.031879425048828125, -0.02841663360595703, -0.024953842163085938, -0.021491050720214844, -0.01802825927734375, -0.014565467834472656, -0.011102676391601562, -0.007639884948730469, -0.004177093505859375, -0.0007143020629882812, 0.0027484893798828125, 0.006211280822753906, 0.009674072265625, 0.013136863708496094, 0.016599655151367188, 0.02006244659423828, 0.023525238037109375, 0.02698802947998047, 0.030450820922851562, 0.033913612365722656, 0.03737640380859375, 0.040839195251464844, 0.04430198669433594, 0.04776477813720703, 0.051227569580078125, 0.05469036102294922, 0.05815315246582031, 0.061615943908691406, 0.0650787353515625, 0.0685415267944336, 0.07200431823730469, 0.07546710968017578, 0.07892990112304688, 0.08239269256591797, 0.08585548400878906, 0.08931827545166016, 0.09278106689453125, 0.09624385833740234, 0.09970664978027344, 0.10316944122314453, 0.10663223266601562, 0.11009502410888672, 0.11355781555175781, 0.1170206069946289, 0.1204833984375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 6.0, 10.0, 8.0, 7.0, 14.0, 23.0, 44.0, 77.0, 274.0, 350.0, 74.0, 41.0, 23.0, 14.0, 6.0, 10.0, 3.0, 6.0, 3.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012542724609375, -0.011848926544189453, -0.011155128479003906, -0.01046133041381836, -0.009767532348632812, -0.009073734283447266, -0.008379936218261719, -0.007686138153076172, -0.006992340087890625, -0.006298542022705078, -0.005604743957519531, -0.004910945892333984, -0.0042171478271484375, -0.0035233497619628906, -0.0028295516967773438, -0.002135753631591797, -0.00144195556640625, -0.0007481575012207031, -5.435943603515625e-05, 0.0006394386291503906, 0.0013332366943359375, 0.0020270347595214844, 0.0027208328247070312, 0.003414630889892578, 0.004108428955078125, 0.004802227020263672, 0.005496025085449219, 0.006189823150634766, 0.0068836212158203125, 0.007577419281005859, 0.008271217346191406, 0.008965015411376953, 0.0096588134765625, 0.010352611541748047, 0.011046409606933594, 0.01174020767211914, 0.012434005737304688, 0.013127803802490234, 0.013821601867675781, 0.014515399932861328, 0.015209197998046875, 0.015902996063232422, 0.01659679412841797, 0.017290592193603516, 0.017984390258789062, 0.01867818832397461, 0.019371986389160156, 0.020065784454345703, 0.02075958251953125, 0.021453380584716797, 0.022147178649902344, 0.02284097671508789, 0.023534774780273438, 0.024228572845458984, 0.02492237091064453, 0.025616168975830078, 0.026309967041015625, 0.027003765106201172, 0.02769756317138672, 0.028391361236572266, 0.029085159301757812, 0.02977895736694336, 0.030472755432128906, 0.031166553497314453, 0.0318603515625]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 4.0, 4.0, 8.0, 12.0, 12.0, 32.0, 46.0, 108.0, 209.0, 261.0, 137.0, 77.0, 30.0, 13.0, 19.0, 10.0, 6.0, 6.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.129145622253418, -4.015045166015625, -3.900944709777832, -3.786844253540039, -3.672743558883667, -3.558643102645874, -3.444542646408081, -3.330442190170288, -3.216341495513916, -3.102241039276123, -2.98814058303833, -2.874040126800537, -2.759939432144165, -2.645838975906372, -2.531738519668579, -2.417638063430786, -2.303537607192993, -2.1894371509552, -2.0753366947174072, -1.9612361192703247, -1.8471355438232422, -1.7330350875854492, -1.6189346313476562, -1.5048341751098633, -1.3907335996627808, -1.2766331434249878, -1.1625325679779053, -1.0484321117401123, -0.9343315958976746, -0.8202310800552368, -0.7061306238174438, -0.5920301079750061, -0.47792959213256836, -0.3638290762901306, -0.24972859025001526, -0.1356281042098999, -0.021527588367462158, 0.09257292747497559, 0.20667338371276855, 0.3207738995552063, 0.43487441539764404, 0.5489749312400818, 0.6630754470825195, 0.7771759033203125, 0.8912764191627502, 1.005376935005188, 1.119477391242981, 1.2335779666900635, 1.3476784229278564, 1.4617788791656494, 1.575879454612732, 1.689979910850525, 1.8040804862976074, 1.9181809425354004, 2.0322813987731934, 2.1463818550109863, 2.2604823112487793, 2.3745827674865723, 2.4886832237243652, 2.602783679962158, 2.7168843746185303, 2.8309848308563232, 2.945085287094116, 3.059185743331909, 3.1732864379882812]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 7.0, 9.0, 4.0, 5.0, 9.0, 11.0, 15.0, 29.0, 20.0, 45.0, 45.0, 49.0, 54.0, 53.0, 57.0, 60.0, 54.0, 58.0, 66.0, 42.0, 45.0, 47.0, 35.0, 29.0, 23.0, 10.0, 19.0, 15.0, 19.0, 21.0, 5.0, 13.0, 2.0, 7.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3247147798538208, -1.2860833406448364, -1.2474520206451416, -1.2088205814361572, -1.1701891422271729, -1.1315577030181885, -1.0929263830184937, -1.0542949438095093, -1.0156636238098145, -0.9770322442054749, -0.9384008049964905, -0.8997694253921509, -0.8611379861831665, -0.8225066065788269, -0.7838752269744873, -0.7452437877655029, -0.7066123485565186, -0.667980968952179, -0.6293495297431946, -0.590718150138855, -0.5520867109298706, -0.513455331325531, -0.4748239517211914, -0.4361925423145294, -0.39756113290786743, -0.35892972350120544, -0.32029831409454346, -0.28166693449020386, -0.24303552508354187, -0.20440411567687988, -0.1657727211713791, -0.1271413266658783, -0.08851003646850586, -0.04987863451242447, -0.011247232556343079, 0.027384169399738312, 0.0660155713558197, 0.10464698076248169, 0.14327837526798248, 0.18190976977348328, 0.22054117918014526, 0.25917258858680725, 0.29780399799346924, 0.33643537759780884, 0.3750667870044708, 0.4136981964111328, 0.4523295760154724, 0.4909609854221344, 0.5295923948287964, 0.568223774433136, 0.6068552136421204, 0.64548659324646, 0.6841180324554443, 0.7227494120597839, 0.7613807916641235, 0.8000122308731079, 0.8386436104774475, 0.8772749900817871, 0.9159064292907715, 0.9545378088951111, 0.9931691884994507, 1.031800627708435, 1.0704320669174194, 1.1090633869171143, 1.1476948261260986]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 2.0, 5.0, 4.0, 9.0, 8.0, 14.0, 18.0, 30.0, 37.0, 50.0, 95.0, 148.0, 256.0, 429.0, 794.0, 1563.0, 3264.0, 7900.0, 21247.0, 71944.0, 354205.0, 458317.0, 86806.0, 24890.0, 8904.0, 3762.0, 1779.0, 894.0, 477.0, 267.0, 139.0, 95.0, 72.0, 37.0, 31.0, 15.0, 11.0, 14.0, 7.0, 5.0, 1.0, 5.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.361328125, -1.322509765625, -1.28369140625, -1.244873046875, -1.2060546875, -1.167236328125, -1.12841796875, -1.089599609375, -1.05078125, -1.011962890625, -0.97314453125, -0.934326171875, -0.8955078125, -0.856689453125, -0.81787109375, -0.779052734375, -0.740234375, -0.701416015625, -0.66259765625, -0.623779296875, -0.5849609375, -0.546142578125, -0.50732421875, -0.468505859375, -0.4296875, -0.390869140625, -0.35205078125, -0.313232421875, -0.2744140625, -0.235595703125, -0.19677734375, -0.157958984375, -0.119140625, -0.080322265625, -0.04150390625, -0.002685546875, 0.0361328125, 0.074951171875, 0.11376953125, 0.152587890625, 0.19140625, 0.230224609375, 0.26904296875, 0.307861328125, 0.3466796875, 0.385498046875, 0.42431640625, 0.463134765625, 0.501953125, 0.540771484375, 0.57958984375, 0.618408203125, 0.6572265625, 0.696044921875, 0.73486328125, 0.773681640625, 0.8125, 0.851318359375, 0.89013671875, 0.928955078125, 0.9677734375, 1.006591796875, 1.04541015625, 1.084228515625, 1.123046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 9.0, 18.0, 12.0, 16.0, 10.0, 15.0, 19.0, 27.0, 32.0, 44.0, 41.0, 52.0, 61.0, 57.0, 60.0, 73.0, 58.0, 43.0, 43.0, 57.0, 35.0, 43.0, 30.0, 32.0, 16.0, 22.0, 10.0, 8.0, 14.0, 11.0, 5.0, 2.0, 5.0, 4.0, 1.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0], "bins": [-3.419921875, -3.330657958984375, -3.24139404296875, -3.152130126953125, -3.0628662109375, -2.973602294921875, -2.88433837890625, -2.795074462890625, -2.705810546875, -2.616546630859375, -2.52728271484375, -2.438018798828125, -2.3487548828125, -2.259490966796875, -2.17022705078125, -2.080963134765625, -1.99169921875, -1.902435302734375, -1.81317138671875, -1.723907470703125, -1.6346435546875, -1.545379638671875, -1.45611572265625, -1.366851806640625, -1.277587890625, -1.188323974609375, -1.09906005859375, -1.009796142578125, -0.9205322265625, -0.831268310546875, -0.74200439453125, -0.652740478515625, -0.5634765625, -0.474212646484375, -0.38494873046875, -0.295684814453125, -0.2064208984375, -0.117156982421875, -0.02789306640625, 0.061370849609375, 0.150634765625, 0.239898681640625, 0.32916259765625, 0.418426513671875, 0.5076904296875, 0.596954345703125, 0.68621826171875, 0.775482177734375, 0.86474609375, 0.954010009765625, 1.04327392578125, 1.132537841796875, 1.2218017578125, 1.311065673828125, 1.40032958984375, 1.489593505859375, 1.578857421875, 1.668121337890625, 1.75738525390625, 1.846649169921875, 1.9359130859375, 2.025177001953125, 2.11444091796875, 2.203704833984375, 2.29296875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 7.0, 5.0, 6.0, 3.0, 11.0, 13.0, 8.0, 11.0, 14.0, 16.0, 30.0, 37.0, 35.0, 31.0, 35.0, 34.0, 35.0, 42.0, 80.0, 677.0, 854934.0, 191594.0, 453.0, 81.0, 35.0, 49.0, 44.0, 32.0, 23.0, 29.0, 37.0, 16.0, 21.0, 24.0, 16.0, 13.0, 3.0, 6.0, 6.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.21875, -8.95489501953125, -8.6910400390625, -8.42718505859375, -8.163330078125, -7.89947509765625, -7.6356201171875, -7.37176513671875, -7.10791015625, -6.84405517578125, -6.5802001953125, -6.31634521484375, -6.052490234375, -5.78863525390625, -5.5247802734375, -5.26092529296875, -4.9970703125, -4.73321533203125, -4.4693603515625, -4.20550537109375, -3.941650390625, -3.67779541015625, -3.4139404296875, -3.15008544921875, -2.88623046875, -2.62237548828125, -2.3585205078125, -2.09466552734375, -1.830810546875, -1.56695556640625, -1.3031005859375, -1.03924560546875, -0.775390625, -0.51153564453125, -0.2476806640625, 0.01617431640625, 0.280029296875, 0.54388427734375, 0.8077392578125, 1.07159423828125, 1.33544921875, 1.59930419921875, 1.8631591796875, 2.12701416015625, 2.390869140625, 2.65472412109375, 2.9185791015625, 3.18243408203125, 3.4462890625, 3.71014404296875, 3.9739990234375, 4.23785400390625, 4.501708984375, 4.76556396484375, 5.0294189453125, 5.29327392578125, 5.55712890625, 5.82098388671875, 6.0848388671875, 6.34869384765625, 6.612548828125, 6.87640380859375, 7.1402587890625, 7.40411376953125, 7.66796875]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 8.0, 7.0, 5.0, 8.0, 11.0, 8.0, 12.0, 14.0, 19.0, 35.0, 32.0, 42.0, 30.0, 32.0, 31.0, 38.0, 46.0, 45.0, 44.0, 60.0, 39.0, 38.0, 37.0, 38.0, 33.0, 37.0, 37.0, 33.0, 36.0, 22.0, 25.0, 20.0, 15.0, 22.0, 15.0, 3.0, 5.0, 4.0, 6.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.9765625, -2.891021728515625, -2.80548095703125, -2.719940185546875, -2.6343994140625, -2.548858642578125, -2.46331787109375, -2.377777099609375, -2.292236328125, -2.206695556640625, -2.12115478515625, -2.035614013671875, -1.9500732421875, -1.864532470703125, -1.77899169921875, -1.693450927734375, -1.60791015625, -1.522369384765625, -1.43682861328125, -1.351287841796875, -1.2657470703125, -1.180206298828125, -1.09466552734375, -1.009124755859375, -0.923583984375, -0.838043212890625, -0.75250244140625, -0.666961669921875, -0.5814208984375, -0.495880126953125, -0.41033935546875, -0.324798583984375, -0.2392578125, -0.153717041015625, -0.06817626953125, 0.017364501953125, 0.1029052734375, 0.188446044921875, 0.27398681640625, 0.359527587890625, 0.445068359375, 0.530609130859375, 0.61614990234375, 0.701690673828125, 0.7872314453125, 0.872772216796875, 0.95831298828125, 1.043853759765625, 1.12939453125, 1.214935302734375, 1.30047607421875, 1.386016845703125, 1.4715576171875, 1.557098388671875, 1.64263916015625, 1.728179931640625, 1.813720703125, 1.899261474609375, 1.98480224609375, 2.070343017578125, 2.1558837890625, 2.241424560546875, 2.32696533203125, 2.412506103515625, 2.498046875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 6.0, 3.0, 7.0, 18.0, 23.0, 37.0, 54.0, 82.0, 126.0, 232.0, 449.0, 832.0, 2053.0, 5649.0, 25278.0, 307525.0, 655078.0, 38707.0, 7563.0, 2500.0, 1101.0, 519.0, 293.0, 160.0, 80.0, 44.0, 44.0, 34.0, 11.0, 13.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73388671875, -0.7095108032226562, -0.6851348876953125, -0.6607589721679688, -0.636383056640625, -0.6120071411132812, -0.5876312255859375, -0.5632553100585938, -0.53887939453125, -0.5145034790039062, -0.4901275634765625, -0.46575164794921875, -0.441375732421875, -0.41699981689453125, -0.3926239013671875, -0.36824798583984375, -0.3438720703125, -0.31949615478515625, -0.2951202392578125, -0.27074432373046875, -0.246368408203125, -0.22199249267578125, -0.1976165771484375, -0.17324066162109375, -0.14886474609375, -0.12448883056640625, -0.1001129150390625, -0.07573699951171875, -0.051361083984375, -0.02698516845703125, -0.0026092529296875, 0.02176666259765625, 0.046142578125, 0.07051849365234375, 0.0948944091796875, 0.11927032470703125, 0.143646240234375, 0.16802215576171875, 0.1923980712890625, 0.21677398681640625, 0.24114990234375, 0.26552581787109375, 0.2899017333984375, 0.31427764892578125, 0.338653564453125, 0.36302947998046875, 0.3874053955078125, 0.41178131103515625, 0.4361572265625, 0.46053314208984375, 0.4849090576171875, 0.5092849731445312, 0.533660888671875, 0.5580368041992188, 0.5824127197265625, 0.6067886352539062, 0.63116455078125, 0.6555404663085938, 0.6799163818359375, 0.7042922973632812, 0.728668212890625, 0.7530441284179688, 0.7774200439453125, 0.8017959594726562, 0.826171875]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 2.0, 6.0, 9.0, 8.0, 15.0, 16.0, 38.0, 43.0, 72.0, 141.0, 199.0, 145.0, 109.0, 61.0, 33.0, 38.0, 14.0, 19.0, 8.0, 3.0, 3.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0001399517059326172, -0.00013592466711997986, -0.00013189762830734253, -0.0001278705894947052, -0.00012384355068206787, -0.00011981651186943054, -0.00011578947305679321, -0.00011176243424415588, -0.00010773539543151855, -0.00010370835661888123, -9.96813178062439e-05, -9.565427899360657e-05, -9.162724018096924e-05, -8.760020136833191e-05, -8.357316255569458e-05, -7.954612374305725e-05, -7.551908493041992e-05, -7.149204611778259e-05, -6.746500730514526e-05, -6.343796849250793e-05, -5.9410929679870605e-05, -5.5383890867233276e-05, -5.135685205459595e-05, -4.732981324195862e-05, -4.330277442932129e-05, -3.927573561668396e-05, -3.524869680404663e-05, -3.12216579914093e-05, -2.7194619178771973e-05, -2.3167580366134644e-05, -1.9140541553497314e-05, -1.5113502740859985e-05, -1.1086463928222656e-05, -7.059425115585327e-06, -3.032386302947998e-06, 9.94652509689331e-07, 5.02169132232666e-06, 9.04873013496399e-06, 1.3075768947601318e-05, 1.7102807760238647e-05, 2.1129846572875977e-05, 2.5156885385513306e-05, 2.9183924198150635e-05, 3.3210963010787964e-05, 3.723800182342529e-05, 4.126504063606262e-05, 4.529207944869995e-05, 4.931911826133728e-05, 5.334615707397461e-05, 5.737319588661194e-05, 6.140023469924927e-05, 6.54272735118866e-05, 6.945431232452393e-05, 7.348135113716125e-05, 7.750838994979858e-05, 8.153542876243591e-05, 8.556246757507324e-05, 8.958950638771057e-05, 9.36165452003479e-05, 9.764358401298523e-05, 0.00010167062282562256, 0.00010569766163825989, 0.00010972470045089722, 0.00011375173926353455, 0.00011777877807617188]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 6.0, 9.0, 6.0, 12.0, 8.0, 16.0, 29.0, 35.0, 45.0, 82.0, 107.0, 226.0, 338.0, 727.0, 1469.0, 3319.0, 9574.0, 39787.0, 297847.0, 609315.0, 63743.0, 13805.0, 4344.0, 1761.0, 875.0, 425.0, 233.0, 151.0, 82.0, 43.0, 32.0, 32.0, 17.0, 15.0, 15.0, 13.0, 6.0, 1.0, 7.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5771484375, -0.56024169921875, -0.5433349609375, -0.52642822265625, -0.509521484375, -0.49261474609375, -0.4757080078125, -0.45880126953125, -0.44189453125, -0.42498779296875, -0.4080810546875, -0.39117431640625, -0.374267578125, -0.35736083984375, -0.3404541015625, -0.32354736328125, -0.306640625, -0.28973388671875, -0.2728271484375, -0.25592041015625, -0.239013671875, -0.22210693359375, -0.2052001953125, -0.18829345703125, -0.17138671875, -0.15447998046875, -0.1375732421875, -0.12066650390625, -0.103759765625, -0.08685302734375, -0.0699462890625, -0.05303955078125, -0.0361328125, -0.01922607421875, -0.0023193359375, 0.01458740234375, 0.031494140625, 0.04840087890625, 0.0653076171875, 0.08221435546875, 0.09912109375, 0.11602783203125, 0.1329345703125, 0.14984130859375, 0.166748046875, 0.18365478515625, 0.2005615234375, 0.21746826171875, 0.234375, 0.25128173828125, 0.2681884765625, 0.28509521484375, 0.302001953125, 0.31890869140625, 0.3358154296875, 0.35272216796875, 0.36962890625, 0.38653564453125, 0.4034423828125, 0.42034912109375, 0.437255859375, 0.45416259765625, 0.4710693359375, 0.48797607421875, 0.5048828125]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 8.0, 1.0, 11.0, 13.0, 20.0, 22.0, 29.0, 27.0, 38.0, 54.0, 71.0, 105.0, 129.0, 116.0, 84.0, 64.0, 45.0, 41.0, 26.0, 20.0, 13.0, 10.0, 16.0, 11.0, 11.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.22705078125, -0.2201061248779297, -0.21316146850585938, -0.20621681213378906, -0.19927215576171875, -0.19232749938964844, -0.18538284301757812, -0.1784381866455078, -0.1714935302734375, -0.1645488739013672, -0.15760421752929688, -0.15065956115722656, -0.14371490478515625, -0.13677024841308594, -0.12982559204101562, -0.12288093566894531, -0.115936279296875, -0.10899162292480469, -0.10204696655273438, -0.09510231018066406, -0.08815765380859375, -0.08121299743652344, -0.07426834106445312, -0.06732368469238281, -0.0603790283203125, -0.05343437194824219, -0.046489715576171875, -0.03954505920410156, -0.03260040283203125, -0.025655746459960938, -0.018711090087890625, -0.011766433715820312, -0.00482177734375, 0.0021228790283203125, 0.009067535400390625, 0.016012191772460938, 0.02295684814453125, 0.029901504516601562, 0.036846160888671875, 0.04379081726074219, 0.0507354736328125, 0.05768013000488281, 0.06462478637695312, 0.07156944274902344, 0.07851409912109375, 0.08545875549316406, 0.09240341186523438, 0.09934806823730469, 0.106292724609375, 0.11323738098144531, 0.12018203735351562, 0.12712669372558594, 0.13407135009765625, 0.14101600646972656, 0.14796066284179688, 0.1549053192138672, 0.1618499755859375, 0.1687946319580078, 0.17573928833007812, 0.18268394470214844, 0.18962860107421875, 0.19657325744628906, 0.20351791381835938, 0.2104625701904297, 0.2174072265625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 14.0, 27.0, 58.0, 239.0, 429.0, 153.0, 47.0, 19.0, 11.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8340229988098145, -4.407226085662842, -3.980429172515869, -3.5536322593688965, -3.126835346221924, -2.7000386714935303, -2.2732417583465576, -1.846444845199585, -1.4196479320526123, -0.9928510189056396, -0.5660541653633118, -0.1392573118209839, 0.28753960132598877, 0.7143363952636719, 1.1411333084106445, 1.5679302215576172, 1.9947271347045898, 2.4215240478515625, 2.848320960998535, 3.275117874145508, 3.7019147872924805, 4.128711700439453, 4.555508613586426, 4.982305526733398, 5.409102439880371, 5.835899353027344, 6.262696266174316, 6.689493179321289, 7.116290092468262, 7.543087005615234, 7.969883918762207, 8.39668083190918, 8.823477745056152, 9.250274658203125, 9.677071571350098, 10.10386848449707, 10.530665397644043, 10.957462310791016, 11.384259223937988, 11.811056137084961, 12.237853050231934, 12.664649963378906, 13.091446876525879, 13.518243789672852, 13.945040702819824, 14.371837615966797, 14.79863452911377, 15.225431442260742, 15.652227401733398, 16.079023361206055, 16.505821228027344, 16.9326171875, 17.35941505432129, 17.786211013793945, 18.213008880615234, 18.63980484008789, 19.06660270690918, 19.493398666381836, 19.920196533203125, 20.34699249267578, 20.77379035949707, 21.200586318969727, 21.627384185791016, 22.054180145263672, 22.48097801208496]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 7.0, 2.0, 14.0, 9.0, 9.0, 30.0, 15.0, 23.0, 39.0, 48.0, 45.0, 46.0, 37.0, 59.0, 56.0, 69.0, 66.0, 56.0, 55.0, 57.0, 53.0, 46.0, 34.0, 40.0, 21.0, 15.0, 14.0, 7.0, 14.0, 8.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.458180904388428, -6.271032810211182, -6.0838847160339355, -5.8967366218566895, -5.709588050842285, -5.522439956665039, -5.335291862487793, -5.148143768310547, -4.960995674133301, -4.773847579956055, -4.586699485778809, -4.3995513916015625, -4.212403297424316, -4.025254726409912, -3.838106632232666, -3.65095853805542, -3.463810443878174, -3.2766623497009277, -3.0895142555236816, -2.9023659229278564, -2.7152178287506104, -2.5280697345733643, -2.340921401977539, -2.153773307800293, -1.9666252136230469, -1.7794771194458008, -1.5923289060592651, -1.4051806926727295, -1.2180325984954834, -1.0308845043182373, -0.8437362909317017, -0.656588077545166, -0.4694399833679199, -0.28229182958602905, -0.09514367580413818, 0.09200447797775269, 0.27915263175964355, 0.4663007855415344, 0.6534489393234253, 0.8405971527099609, 1.027745246887207, 1.2148933410644531, 1.4020415544509888, 1.5891897678375244, 1.7763378620147705, 1.9634859561920166, 2.150634288787842, 2.337782382965088, 2.524930477142334, 2.71207857131958, 2.899226665496826, 3.0863749980926514, 3.2735230922698975, 3.4606711864471436, 3.6478195190429688, 3.834967613220215, 4.022115707397461, 4.209263801574707, 4.396411895751953, 4.583559989929199, 4.770708084106445, 4.95785665512085, 5.145004749298096, 5.332152843475342, 5.519300937652588]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 9.0, 4.0, 7.0, 9.0, 12.0, 18.0, 39.0, 58.0, 95.0, 198.0, 448.0, 1126.0, 3983.0, 22101.0, 374345.0, 3678009.0, 99011.0, 11015.0, 2406.0, 756.0, 324.0, 145.0, 74.0, 38.0, 22.0, 11.0, 8.0, 3.0, 4.0, 1.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.08984375, -4.960357666015625, -4.83087158203125, -4.701385498046875, -4.5718994140625, -4.442413330078125, -4.31292724609375, -4.183441162109375, -4.053955078125, -3.924468994140625, -3.79498291015625, -3.665496826171875, -3.5360107421875, -3.406524658203125, -3.27703857421875, -3.147552490234375, -3.01806640625, -2.888580322265625, -2.75909423828125, -2.629608154296875, -2.5001220703125, -2.370635986328125, -2.24114990234375, -2.111663818359375, -1.982177734375, -1.852691650390625, -1.72320556640625, -1.593719482421875, -1.4642333984375, -1.334747314453125, -1.20526123046875, -1.075775146484375, -0.9462890625, -0.816802978515625, -0.68731689453125, -0.557830810546875, -0.4283447265625, -0.298858642578125, -0.16937255859375, -0.039886474609375, 0.089599609375, 0.219085693359375, 0.34857177734375, 0.478057861328125, 0.6075439453125, 0.737030029296875, 0.86651611328125, 0.996002197265625, 1.12548828125, 1.254974365234375, 1.38446044921875, 1.513946533203125, 1.6434326171875, 1.772918701171875, 1.90240478515625, 2.031890869140625, 2.161376953125, 2.290863037109375, 2.42034912109375, 2.549835205078125, 2.6793212890625, 2.808807373046875, 2.93829345703125, 3.067779541015625, 3.197265625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 1.0, 4.0, 2.0, 7.0, 3.0, 4.0, 4.0, 9.0, 9.0, 21.0, 14.0, 18.0, 18.0, 31.0, 33.0, 46.0, 49.0, 60.0, 61.0, 51.0, 72.0, 52.0, 53.0, 58.0, 50.0, 39.0, 36.0, 27.0, 24.0, 16.0, 15.0, 19.0, 13.0, 17.0, 17.0, 12.0, 8.0, 2.0, 6.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4296875, -1.3863525390625, -1.343017578125, -1.2996826171875, -1.25634765625, -1.2130126953125, -1.169677734375, -1.1263427734375, -1.0830078125, -1.0396728515625, -0.996337890625, -0.9530029296875, -0.90966796875, -0.8663330078125, -0.822998046875, -0.7796630859375, -0.736328125, -0.6929931640625, -0.649658203125, -0.6063232421875, -0.56298828125, -0.5196533203125, -0.476318359375, -0.4329833984375, -0.3896484375, -0.3463134765625, -0.302978515625, -0.2596435546875, -0.21630859375, -0.1729736328125, -0.129638671875, -0.0863037109375, -0.04296875, 0.0003662109375, 0.043701171875, 0.0870361328125, 0.13037109375, 0.1737060546875, 0.217041015625, 0.2603759765625, 0.3037109375, 0.3470458984375, 0.390380859375, 0.4337158203125, 0.47705078125, 0.5203857421875, 0.563720703125, 0.6070556640625, 0.650390625, 0.6937255859375, 0.737060546875, 0.7803955078125, 0.82373046875, 0.8670654296875, 0.910400390625, 0.9537353515625, 0.9970703125, 1.0404052734375, 1.083740234375, 1.1270751953125, 1.17041015625, 1.2137451171875, 1.257080078125, 1.3004150390625, 1.34375]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 5.0, 4.0, 9.0, 12.0, 13.0, 23.0, 39.0, 74.0, 162.0, 318.0, 1010.0, 4896.0, 77196.0, 4029152.0, 74834.0, 4925.0, 958.0, 322.0, 137.0, 66.0, 44.0, 27.0, 15.0, 11.0, 7.0, 5.0, 8.0, 3.0, 3.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.3671875, -7.17578125, -6.984375, -6.79296875, -6.6015625, -6.41015625, -6.21875, -6.02734375, -5.8359375, -5.64453125, -5.453125, -5.26171875, -5.0703125, -4.87890625, -4.6875, -4.49609375, -4.3046875, -4.11328125, -3.921875, -3.73046875, -3.5390625, -3.34765625, -3.15625, -2.96484375, -2.7734375, -2.58203125, -2.390625, -2.19921875, -2.0078125, -1.81640625, -1.625, -1.43359375, -1.2421875, -1.05078125, -0.859375, -0.66796875, -0.4765625, -0.28515625, -0.09375, 0.09765625, 0.2890625, 0.48046875, 0.671875, 0.86328125, 1.0546875, 1.24609375, 1.4375, 1.62890625, 1.8203125, 2.01171875, 2.203125, 2.39453125, 2.5859375, 2.77734375, 2.96875, 3.16015625, 3.3515625, 3.54296875, 3.734375, 3.92578125, 4.1171875, 4.30859375, 4.5, 4.69140625, 4.8828125]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 8.0, 7.0, 5.0, 12.0, 13.0, 21.0, 21.0, 26.0, 27.0, 39.0, 37.0, 64.0, 96.0, 99.0, 136.0, 170.0, 263.0, 475.0, 875.0, 537.0, 321.0, 212.0, 142.0, 110.0, 70.0, 75.0, 49.0, 37.0, 18.0, 20.0, 18.0, 12.0, 10.0, 10.0, 9.0, 5.0, 3.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.55712890625, -0.5418930053710938, -0.5266571044921875, -0.5114212036132812, -0.496185302734375, -0.48094940185546875, -0.4657135009765625, -0.45047760009765625, -0.43524169921875, -0.42000579833984375, -0.4047698974609375, -0.38953399658203125, -0.374298095703125, -0.35906219482421875, -0.3438262939453125, -0.32859039306640625, -0.3133544921875, -0.29811859130859375, -0.2828826904296875, -0.26764678955078125, -0.252410888671875, -0.23717498779296875, -0.2219390869140625, -0.20670318603515625, -0.19146728515625, -0.17623138427734375, -0.1609954833984375, -0.14575958251953125, -0.130523681640625, -0.11528778076171875, -0.1000518798828125, -0.08481597900390625, -0.069580078125, -0.05434417724609375, -0.0391082763671875, -0.02387237548828125, -0.008636474609375, 0.00659942626953125, 0.0218353271484375, 0.03707122802734375, 0.05230712890625, 0.06754302978515625, 0.0827789306640625, 0.09801483154296875, 0.113250732421875, 0.12848663330078125, 0.1437225341796875, 0.15895843505859375, 0.1741943359375, 0.18943023681640625, 0.2046661376953125, 0.21990203857421875, 0.235137939453125, 0.25037384033203125, 0.2656097412109375, 0.28084564208984375, 0.29608154296875, 0.31131744384765625, 0.3265533447265625, 0.34178924560546875, 0.357025146484375, 0.37226104736328125, 0.3874969482421875, 0.40273284912109375, 0.41796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 2.0, 10.0, 5.0, 11.0, 10.0, 17.0, 21.0, 38.0, 72.0, 108.0, 140.0, 172.0, 142.0, 101.0, 54.0, 31.0, 17.0, 13.0, 9.0, 6.0, 9.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.207167625427246, -3.095102310180664, -2.983036756515503, -2.870971202850342, -2.7589058876037598, -2.6468405723571777, -2.5347750186920166, -2.4227094650268555, -2.3106441497802734, -2.1985788345336914, -2.0865132808685303, -1.9744478464126587, -1.862382411956787, -1.7503169775009155, -1.638251543045044, -1.5261861085891724, -1.4141206741333008, -1.3020552396774292, -1.1899898052215576, -1.077924370765686, -0.9658589363098145, -0.8537935018539429, -0.7417280673980713, -0.6296626329421997, -0.5175971984863281, -0.40553176403045654, -0.29346632957458496, -0.18140089511871338, -0.0693354606628418, 0.042729973793029785, 0.15479540824890137, 0.26686084270477295, 0.37892627716064453, 0.4909917116165161, 0.6030571460723877, 0.7151225805282593, 0.8271880149841309, 0.9392534494400024, 1.051318883895874, 1.1633843183517456, 1.2754497528076172, 1.3875151872634888, 1.4995806217193604, 1.611646056175232, 1.7237114906311035, 1.835776925086975, 1.9478423595428467, 2.059907913208008, 2.17197322845459, 2.284038543701172, 2.396104097366333, 2.508169651031494, 2.620234966278076, 2.732300281524658, 2.8443658351898193, 2.9564313888549805, 3.0684967041015625, 3.1805620193481445, 3.2926275730133057, 3.404693126678467, 3.516758441925049, 3.628823757171631, 3.740889310836792, 3.852954864501953, 3.965020179748535]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 2.0, 5.0, 2.0, 4.0, 9.0, 9.0, 10.0, 13.0, 16.0, 24.0, 22.0, 25.0, 37.0, 28.0, 38.0, 35.0, 54.0, 49.0, 46.0, 45.0, 59.0, 49.0, 40.0, 43.0, 43.0, 45.0, 39.0, 32.0, 29.0, 18.0, 20.0, 23.0, 19.0, 19.0, 10.0, 6.0, 10.0, 8.0, 6.0, 1.0, 3.0, 5.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.6754878759384155, -1.627683401107788, -1.5798790454864502, -1.5320745706558228, -1.4842700958251953, -1.4364656209945679, -1.3886611461639404, -1.3408567905426025, -1.293052315711975, -1.2452478408813477, -1.1974434852600098, -1.1496390104293823, -1.1018345355987549, -1.0540300607681274, -1.0062255859375, -0.9584212303161621, -0.9106167554855347, -0.8628122806549072, -0.8150078654289246, -0.7672034502029419, -0.7193989753723145, -0.671594500541687, -0.6237900853157043, -0.5759856700897217, -0.5281811952590942, -0.4803767502307892, -0.43257230520248413, -0.3847678601741791, -0.336963415145874, -0.28915897011756897, -0.24135452508926392, -0.19355008006095886, -0.14574551582336426, -0.0979410707950592, -0.05013662576675415, -0.0023321807384490967, 0.04547226428985596, 0.09327670931816101, 0.14108115434646606, 0.18888559937477112, 0.23669004440307617, 0.2844944894313812, 0.3322989344596863, 0.38010337948799133, 0.4279078245162964, 0.47571226954460144, 0.5235167145729065, 0.5713211297988892, 0.6191256046295166, 0.666930079460144, 0.7147344946861267, 0.7625389099121094, 0.8103433847427368, 0.8581478595733643, 0.9059522747993469, 0.9537566900253296, 1.001561164855957, 1.0493656396865845, 1.097170114517212, 1.1449744701385498, 1.1927789449691772, 1.2405834197998047, 1.2883877754211426, 1.33619225025177, 1.3839967250823975]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 3.0, 1.0, 1.0, 5.0, 6.0, 6.0, 9.0, 12.0, 13.0, 23.0, 33.0, 46.0, 58.0, 94.0, 130.0, 256.0, 376.0, 799.0, 1954.0, 6571.0, 44193.0, 749175.0, 222094.0, 16462.0, 3549.0, 1246.0, 533.0, 327.0, 172.0, 134.0, 70.0, 53.0, 32.0, 30.0, 19.0, 21.0, 16.0, 7.0, 4.0, 4.0, 2.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.3271484375, -0.3168525695800781, -0.30655670166015625, -0.2962608337402344, -0.2859649658203125, -0.2756690979003906, -0.26537322998046875, -0.2550773620605469, -0.244781494140625, -0.23448562622070312, -0.22418975830078125, -0.21389389038085938, -0.2035980224609375, -0.19330215454101562, -0.18300628662109375, -0.17271041870117188, -0.16241455078125, -0.15211868286132812, -0.14182281494140625, -0.13152694702148438, -0.1212310791015625, -0.11093521118164062, -0.10063934326171875, -0.09034347534179688, -0.080047607421875, -0.06975173950195312, -0.05945587158203125, -0.049160003662109375, -0.0388641357421875, -0.028568267822265625, -0.01827239990234375, -0.007976531982421875, 0.0023193359375, 0.012615203857421875, 0.02291107177734375, 0.033206939697265625, 0.0435028076171875, 0.053798675537109375, 0.06409454345703125, 0.07439041137695312, 0.084686279296875, 0.09498214721679688, 0.10527801513671875, 0.11557388305664062, 0.1258697509765625, 0.13616561889648438, 0.14646148681640625, 0.15675735473632812, 0.16705322265625, 0.17734909057617188, 0.18764495849609375, 0.19794082641601562, 0.2082366943359375, 0.21853256225585938, 0.22882843017578125, 0.23912429809570312, 0.249420166015625, 0.2597160339355469, 0.27001190185546875, 0.2803077697753906, 0.2906036376953125, 0.3008995056152344, 0.31119537353515625, 0.3214912414550781, 0.331787109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 1.0, 1.0, 3.0, 7.0, 2.0, 8.0, 9.0, 7.0, 10.0, 17.0, 24.0, 14.0, 21.0, 29.0, 32.0, 40.0, 54.0, 57.0, 42.0, 57.0, 57.0, 52.0, 56.0, 46.0, 49.0, 39.0, 43.0, 37.0, 32.0, 28.0, 17.0, 25.0, 15.0, 10.0, 12.0, 10.0, 11.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.0732421875, -1.0401611328125, -1.007080078125, -0.9739990234375, -0.94091796875, -0.9078369140625, -0.874755859375, -0.8416748046875, -0.80859375, -0.7755126953125, -0.742431640625, -0.7093505859375, -0.67626953125, -0.6431884765625, -0.610107421875, -0.5770263671875, -0.5439453125, -0.5108642578125, -0.477783203125, -0.4447021484375, -0.41162109375, -0.3785400390625, -0.345458984375, -0.3123779296875, -0.279296875, -0.2462158203125, -0.213134765625, -0.1800537109375, -0.14697265625, -0.1138916015625, -0.080810546875, -0.0477294921875, -0.0146484375, 0.0184326171875, 0.051513671875, 0.0845947265625, 0.11767578125, 0.1507568359375, 0.183837890625, 0.2169189453125, 0.25, 0.2830810546875, 0.316162109375, 0.3492431640625, 0.38232421875, 0.4154052734375, 0.448486328125, 0.4815673828125, 0.5146484375, 0.5477294921875, 0.580810546875, 0.6138916015625, 0.64697265625, 0.6800537109375, 0.713134765625, 0.7462158203125, 0.779296875, 0.8123779296875, 0.845458984375, 0.8785400390625, 0.91162109375, 0.9447021484375, 0.977783203125, 1.0108642578125, 1.0439453125]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 5.0, 8.0, 11.0, 13.0, 26.0, 32.0, 39.0, 58.0, 75.0, 96.0, 144.0, 202.0, 320.0, 589.0, 1656.0, 7219.0, 77036.0, 803060.0, 142335.0, 11705.0, 2032.0, 707.0, 381.0, 206.0, 180.0, 104.0, 86.0, 56.0, 45.0, 31.0, 26.0, 17.0, 5.0, 8.0, 11.0, 8.0, 6.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1795654296875, -0.17305946350097656, -0.16655349731445312, -0.1600475311279297, -0.15354156494140625, -0.1470355987548828, -0.14052963256835938, -0.13402366638183594, -0.1275177001953125, -0.12101173400878906, -0.11450576782226562, -0.10799980163574219, -0.10149383544921875, -0.09498786926269531, -0.08848190307617188, -0.08197593688964844, -0.075469970703125, -0.06896400451660156, -0.062458038330078125, -0.05595207214355469, -0.04944610595703125, -0.04294013977050781, -0.036434173583984375, -0.029928207397460938, -0.0234222412109375, -0.016916275024414062, -0.010410308837890625, -0.0039043426513671875, 0.00260162353515625, 0.009107589721679688, 0.015613555908203125, 0.022119522094726562, 0.02862548828125, 0.03513145446777344, 0.041637420654296875, 0.04814338684082031, 0.05464935302734375, 0.06115531921386719, 0.06766128540039062, 0.07416725158691406, 0.0806732177734375, 0.08717918395996094, 0.09368515014648438, 0.10019111633300781, 0.10669708251953125, 0.11320304870605469, 0.11970901489257812, 0.12621498107910156, 0.132720947265625, 0.13922691345214844, 0.14573287963867188, 0.1522388458251953, 0.15874481201171875, 0.1652507781982422, 0.17175674438476562, 0.17826271057128906, 0.1847686767578125, 0.19127464294433594, 0.19778060913085938, 0.2042865753173828, 0.21079254150390625, 0.2172985076904297, 0.22380447387695312, 0.23031044006347656, 0.23681640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 4.0, 9.0, 7.0, 4.0, 16.0, 10.0, 15.0, 10.0, 22.0, 23.0, 25.0, 28.0, 32.0, 44.0, 44.0, 43.0, 53.0, 51.0, 45.0, 55.0, 44.0, 41.0, 45.0, 40.0, 47.0, 38.0, 31.0, 29.0, 27.0, 24.0, 14.0, 15.0, 14.0, 8.0, 11.0, 9.0, 4.0, 10.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.6826171875, -1.63177490234375, -1.5809326171875, -1.53009033203125, -1.479248046875, -1.42840576171875, -1.3775634765625, -1.32672119140625, -1.27587890625, -1.22503662109375, -1.1741943359375, -1.12335205078125, -1.072509765625, -1.02166748046875, -0.9708251953125, -0.91998291015625, -0.869140625, -0.81829833984375, -0.7674560546875, -0.71661376953125, -0.665771484375, -0.61492919921875, -0.5640869140625, -0.51324462890625, -0.46240234375, -0.41156005859375, -0.3607177734375, -0.30987548828125, -0.259033203125, -0.20819091796875, -0.1573486328125, -0.10650634765625, -0.0556640625, -0.00482177734375, 0.0460205078125, 0.09686279296875, 0.147705078125, 0.19854736328125, 0.2493896484375, 0.30023193359375, 0.35107421875, 0.40191650390625, 0.4527587890625, 0.50360107421875, 0.554443359375, 0.60528564453125, 0.6561279296875, 0.70697021484375, 0.7578125, 0.80865478515625, 0.8594970703125, 0.91033935546875, 0.961181640625, 1.01202392578125, 1.0628662109375, 1.11370849609375, 1.16455078125, 1.21539306640625, 1.2662353515625, 1.31707763671875, 1.367919921875, 1.41876220703125, 1.4696044921875, 1.52044677734375, 1.5712890625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 1.0, 16.0, 16.0, 15.0, 31.0, 34.0, 24.0, 30.0, 48.0, 63.0, 80.0, 97.0, 125.0, 230.0, 347.0, 788.0, 2422.0, 13505.0, 720317.0, 297149.0, 9728.0, 1790.0, 606.0, 293.0, 194.0, 125.0, 85.0, 93.0, 62.0, 49.0, 37.0, 28.0, 31.0, 20.0, 11.0, 9.0, 10.0, 8.0, 8.0, 3.0, 8.0, 3.0, 1.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.05755615234375, -0.05556678771972656, -0.053577423095703125, -0.05158805847167969, -0.04959869384765625, -0.04760932922363281, -0.045619964599609375, -0.04363059997558594, -0.0416412353515625, -0.03965187072753906, -0.037662506103515625, -0.03567314147949219, -0.03368377685546875, -0.03169441223144531, -0.029705047607421875, -0.027715682983398438, -0.025726318359375, -0.023736953735351562, -0.021747589111328125, -0.019758224487304688, -0.01776885986328125, -0.015779495239257812, -0.013790130615234375, -0.011800765991210938, -0.0098114013671875, -0.007822036743164062, -0.005832672119140625, -0.0038433074951171875, -0.00185394287109375, 0.0001354217529296875, 0.002124786376953125, 0.0041141510009765625, 0.006103515625, 0.008092880249023438, 0.010082244873046875, 0.012071609497070312, 0.01406097412109375, 0.016050338745117188, 0.018039703369140625, 0.020029067993164062, 0.0220184326171875, 0.024007797241210938, 0.025997161865234375, 0.027986526489257812, 0.02997589111328125, 0.03196525573730469, 0.033954620361328125, 0.03594398498535156, 0.037933349609375, 0.03992271423339844, 0.041912078857421875, 0.04390144348144531, 0.04589080810546875, 0.04788017272949219, 0.049869537353515625, 0.05185890197753906, 0.0538482666015625, 0.05583763122558594, 0.057826995849609375, 0.05981636047363281, 0.06180572509765625, 0.06379508972167969, 0.06578445434570312, 0.06777381896972656, 0.06976318359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 4.0, 5.0, 4.0, 8.0, 9.0, 15.0, 20.0, 28.0, 42.0, 65.0, 89.0, 102.0, 114.0, 110.0, 88.0, 77.0, 51.0, 45.0, 29.0, 22.0, 17.0, 13.0, 10.0, 10.0, 8.0, 4.0, 2.0, 5.0, 4.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0], "bins": [-3.039836883544922e-05, -2.9678456485271454e-05, -2.895854413509369e-05, -2.8238631784915924e-05, -2.751871943473816e-05, -2.6798807084560394e-05, -2.607889473438263e-05, -2.5358982384204865e-05, -2.46390700340271e-05, -2.3919157683849335e-05, -2.319924533367157e-05, -2.2479332983493805e-05, -2.175942063331604e-05, -2.1039508283138275e-05, -2.031959593296051e-05, -1.9599683582782745e-05, -1.887977123260498e-05, -1.8159858882427216e-05, -1.743994653224945e-05, -1.6720034182071686e-05, -1.600012183189392e-05, -1.5280209481716156e-05, -1.4560297131538391e-05, -1.3840384781360626e-05, -1.3120472431182861e-05, -1.2400560081005096e-05, -1.1680647730827332e-05, -1.0960735380649567e-05, -1.0240823030471802e-05, -9.520910680294037e-06, -8.800998330116272e-06, -8.081085979938507e-06, -7.361173629760742e-06, -6.641261279582977e-06, -5.921348929405212e-06, -5.2014365792274475e-06, -4.481524229049683e-06, -3.7616118788719177e-06, -3.041699528694153e-06, -2.321787178516388e-06, -1.601874828338623e-06, -8.819624781608582e-07, -1.6205012798309326e-07, 5.578622221946716e-07, 1.2777745723724365e-06, 1.9976869225502014e-06, 2.7175992727279663e-06, 3.437511622905731e-06, 4.157423973083496e-06, 4.877336323261261e-06, 5.597248673439026e-06, 6.317161023616791e-06, 7.037073373794556e-06, 7.75698572397232e-06, 8.476898074150085e-06, 9.19681042432785e-06, 9.916722774505615e-06, 1.063663512468338e-05, 1.1356547474861145e-05, 1.207645982503891e-05, 1.2796372175216675e-05, 1.351628452539444e-05, 1.4236196875572205e-05, 1.495610922574997e-05, 1.5676021575927734e-05]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 5.0, 14.0, 16.0, 12.0, 26.0, 40.0, 62.0, 89.0, 177.0, 338.0, 654.0, 1383.0, 3830.0, 14017.0, 119796.0, 860012.0, 36514.0, 7164.0, 2417.0, 895.0, 480.0, 236.0, 137.0, 73.0, 55.0, 27.0, 22.0, 17.0, 10.0, 13.0, 5.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.08740234375, -0.08485221862792969, -0.08230209350585938, -0.07975196838378906, -0.07720184326171875, -0.07465171813964844, -0.07210159301757812, -0.06955146789550781, -0.0670013427734375, -0.06445121765136719, -0.061901092529296875, -0.05935096740722656, -0.05680084228515625, -0.05425071716308594, -0.051700592041015625, -0.04915046691894531, -0.046600341796875, -0.04405021667480469, -0.041500091552734375, -0.03894996643066406, -0.03639984130859375, -0.03384971618652344, -0.031299591064453125, -0.028749465942382812, -0.0261993408203125, -0.023649215698242188, -0.021099090576171875, -0.018548965454101562, -0.01599884033203125, -0.013448715209960938, -0.010898590087890625, -0.008348464965820312, -0.00579833984375, -0.0032482147216796875, -0.000698089599609375, 0.0018520355224609375, 0.00440216064453125, 0.0069522857666015625, 0.009502410888671875, 0.012052536010742188, 0.0146026611328125, 0.017152786254882812, 0.019702911376953125, 0.022253036499023438, 0.02480316162109375, 0.027353286743164062, 0.029903411865234375, 0.03245353698730469, 0.035003662109375, 0.03755378723144531, 0.040103912353515625, 0.04265403747558594, 0.04520416259765625, 0.04775428771972656, 0.050304412841796875, 0.05285453796386719, 0.0554046630859375, 0.05795478820800781, 0.060504913330078125, 0.06305503845214844, 0.06560516357421875, 0.06815528869628906, 0.07070541381835938, 0.07325553894042969, 0.0758056640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 3.0, 3.0, 4.0, 10.0, 3.0, 14.0, 10.0, 14.0, 22.0, 39.0, 66.0, 98.0, 161.0, 210.0, 125.0, 67.0, 26.0, 24.0, 24.0, 13.0, 13.0, 7.0, 4.0, 11.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01253509521484375, -0.012157917022705078, -0.011780738830566406, -0.011403560638427734, -0.011026382446289062, -0.01064920425415039, -0.010272026062011719, -0.009894847869873047, -0.009517669677734375, -0.009140491485595703, -0.008763313293457031, -0.00838613510131836, -0.008008956909179688, -0.007631778717041016, -0.007254600524902344, -0.006877422332763672, -0.006500244140625, -0.006123065948486328, -0.005745887756347656, -0.005368709564208984, -0.0049915313720703125, -0.004614353179931641, -0.004237174987792969, -0.003859996795654297, -0.003482818603515625, -0.003105640411376953, -0.0027284622192382812, -0.0023512840270996094, -0.0019741058349609375, -0.0015969276428222656, -0.0012197494506835938, -0.0008425712585449219, -0.00046539306640625, -8.821487426757812e-05, 0.00028896331787109375, 0.0006661415100097656, 0.0010433197021484375, 0.0014204978942871094, 0.0017976760864257812, 0.002174854278564453, 0.002552032470703125, 0.002929210662841797, 0.0033063888549804688, 0.0036835670471191406, 0.0040607452392578125, 0.004437923431396484, 0.004815101623535156, 0.005192279815673828, 0.0055694580078125, 0.005946636199951172, 0.006323814392089844, 0.006700992584228516, 0.0070781707763671875, 0.007455348968505859, 0.007832527160644531, 0.008209705352783203, 0.008586883544921875, 0.008964061737060547, 0.009341239929199219, 0.00971841812133789, 0.010095596313476562, 0.010472774505615234, 0.010849952697753906, 0.011227130889892578, 0.01160430908203125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 4.0, 6.0, 4.0, 7.0, 13.0, 16.0, 22.0, 33.0, 76.0, 161.0, 208.0, 197.0, 104.0, 67.0, 21.0, 20.0, 12.0, 11.0, 7.0, 2.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3700778484344482, -2.281541585922241, -2.1930055618286133, -2.1044692993164062, -2.015933036804199, -1.9273970127105713, -1.8388607501983643, -1.7503246068954468, -1.6617884635925293, -1.5732523202896118, -1.4847161769866943, -1.3961799144744873, -1.3076437711715698, -1.2191076278686523, -1.1305713653564453, -1.0420352220535278, -0.9534990787506104, -0.8649629354476929, -0.7764267325401306, -0.6878905296325684, -0.5993543863296509, -0.5108182430267334, -0.42228204011917114, -0.3337458372116089, -0.2452096939086914, -0.15667352080345154, -0.06813734769821167, 0.020398825407028198, 0.10893499851226807, 0.19747117161750793, 0.2860073447227478, 0.37454354763031006, 0.46307945251464844, 0.5516155958175659, 0.6401517987251282, 0.7286880016326904, 0.8172241449356079, 0.9057602882385254, 0.9942964911460876, 1.08283269405365, 1.1713688373565674, 1.2599049806594849, 1.3484411239624023, 1.4369773864746094, 1.5255135297775269, 1.6140496730804443, 1.7025859355926514, 1.7911220788955688, 1.8796582221984863, 1.9681943655014038, 2.0567305088043213, 2.1452667713165283, 2.2338027954101562, 2.3223390579223633, 2.4108753204345703, 2.4994115829467773, 2.5879476070404053, 2.6764838695526123, 2.7650198936462402, 2.8535561561584473, 2.9420924186706543, 3.0306284427642822, 3.1191647052764893, 3.207700729370117, 3.296236991882324]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 5.0, 4.0, 10.0, 6.0, 11.0, 12.0, 16.0, 28.0, 18.0, 29.0, 32.0, 32.0, 44.0, 43.0, 57.0, 61.0, 56.0, 58.0, 63.0, 45.0, 45.0, 53.0, 49.0, 43.0, 19.0, 32.0, 23.0, 21.0, 14.0, 22.0, 8.0, 7.0, 7.0, 9.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.0773781538009644, -1.0444740056991577, -1.011569857597351, -0.9786656498908997, -0.945761501789093, -0.9128572940826416, -0.879953145980835, -0.8470489978790283, -0.8141448497772217, -0.781240701675415, -0.7483364939689636, -0.715432345867157, -0.6825281977653503, -0.6496239900588989, -0.6167198419570923, -0.5838156938552856, -0.5509114861488342, -0.5180073380470276, -0.48510316014289856, -0.45219898223876953, -0.4192948341369629, -0.38639065623283386, -0.35348647832870483, -0.3205823302268982, -0.28767815232276917, -0.25477397441864014, -0.2218698263168335, -0.18896564841270447, -0.15606148540973663, -0.1231573224067688, -0.09025314450263977, -0.057348981499671936, -0.0244448184967041, 0.008459348231554031, 0.041363514959812164, 0.0742676854133606, 0.10717184841632843, 0.14007601141929626, 0.1729801893234253, 0.20588435232639313, 0.23878851532936096, 0.27169269323349, 0.30459684133529663, 0.33750101923942566, 0.3704051971435547, 0.40330934524536133, 0.43621352314949036, 0.4691177010536194, 0.502021849155426, 0.5349259972572327, 0.5678302049636841, 0.6007343530654907, 0.6336385011672974, 0.666542649269104, 0.6994468569755554, 0.7323510050773621, 0.7652552127838135, 0.7981593608856201, 0.8310635685920715, 0.8639677166938782, 0.8968718647956848, 0.9297760725021362, 0.9626802206039429, 0.9955843687057495, 1.0284885168075562]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 8.0, 5.0, 12.0, 17.0, 25.0, 49.0, 66.0, 125.0, 167.0, 229.0, 390.0, 628.0, 1075.0, 1792.0, 3420.0, 6792.0, 14847.0, 37620.0, 121127.0, 489600.0, 261634.0, 65030.0, 23188.0, 9951.0, 4726.0, 2459.0, 1455.0, 764.0, 481.0, 298.0, 209.0, 115.0, 76.0, 62.0, 39.0, 24.0, 20.0, 8.0, 6.0, 7.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.525390625, -1.48272705078125, -1.4400634765625, -1.39739990234375, -1.354736328125, -1.31207275390625, -1.2694091796875, -1.22674560546875, -1.18408203125, -1.14141845703125, -1.0987548828125, -1.05609130859375, -1.013427734375, -0.97076416015625, -0.9281005859375, -0.88543701171875, -0.8427734375, -0.80010986328125, -0.7574462890625, -0.71478271484375, -0.672119140625, -0.62945556640625, -0.5867919921875, -0.54412841796875, -0.50146484375, -0.45880126953125, -0.4161376953125, -0.37347412109375, -0.330810546875, -0.28814697265625, -0.2454833984375, -0.20281982421875, -0.16015625, -0.11749267578125, -0.0748291015625, -0.03216552734375, 0.010498046875, 0.05316162109375, 0.0958251953125, 0.13848876953125, 0.18115234375, 0.22381591796875, 0.2664794921875, 0.30914306640625, 0.351806640625, 0.39447021484375, 0.4371337890625, 0.47979736328125, 0.5224609375, 0.56512451171875, 0.6077880859375, 0.65045166015625, 0.693115234375, 0.73577880859375, 0.7784423828125, 0.82110595703125, 0.86376953125, 0.90643310546875, 0.9490966796875, 0.99176025390625, 1.034423828125, 1.07708740234375, 1.1197509765625, 1.16241455078125, 1.205078125]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 4.0, 16.0, 12.0, 20.0, 20.0, 27.0, 43.0, 42.0, 58.0, 62.0, 72.0, 66.0, 65.0, 81.0, 61.0, 74.0, 57.0, 38.0, 40.0, 27.0, 19.0, 14.0, 18.0, 14.0, 10.0, 4.0, 9.0, 2.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.927734375, -2.840545654296875, -2.75335693359375, -2.666168212890625, -2.5789794921875, -2.491790771484375, -2.40460205078125, -2.317413330078125, -2.230224609375, -2.143035888671875, -2.05584716796875, -1.968658447265625, -1.8814697265625, -1.794281005859375, -1.70709228515625, -1.619903564453125, -1.53271484375, -1.445526123046875, -1.35833740234375, -1.271148681640625, -1.1839599609375, -1.096771240234375, -1.00958251953125, -0.922393798828125, -0.835205078125, -0.748016357421875, -0.66082763671875, -0.573638916015625, -0.4864501953125, -0.399261474609375, -0.31207275390625, -0.224884033203125, -0.1376953125, -0.050506591796875, 0.03668212890625, 0.123870849609375, 0.2110595703125, 0.298248291015625, 0.38543701171875, 0.472625732421875, 0.559814453125, 0.647003173828125, 0.73419189453125, 0.821380615234375, 0.9085693359375, 0.995758056640625, 1.08294677734375, 1.170135498046875, 1.25732421875, 1.344512939453125, 1.43170166015625, 1.518890380859375, 1.6060791015625, 1.693267822265625, 1.78045654296875, 1.867645263671875, 1.954833984375, 2.042022705078125, 2.12921142578125, 2.216400146484375, 2.3035888671875, 2.390777587890625, 2.47796630859375, 2.565155029296875, 2.65234375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 5.0, 9.0, 5.0, 5.0, 14.0, 12.0, 9.0, 21.0, 22.0, 22.0, 23.0, 39.0, 25.0, 44.0, 44.0, 74.0, 93.0, 311.0, 1883.0, 51684.0, 979498.0, 13177.0, 924.0, 188.0, 94.0, 72.0, 30.0, 33.0, 27.0, 22.0, 21.0, 16.0, 21.0, 13.0, 18.0, 12.0, 8.0, 4.0, 10.0, 4.0, 4.0, 2.0, 6.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.703125, -6.495849609375, -6.28857421875, -6.081298828125, -5.8740234375, -5.666748046875, -5.45947265625, -5.252197265625, -5.044921875, -4.837646484375, -4.63037109375, -4.423095703125, -4.2158203125, -4.008544921875, -3.80126953125, -3.593994140625, -3.38671875, -3.179443359375, -2.97216796875, -2.764892578125, -2.5576171875, -2.350341796875, -2.14306640625, -1.935791015625, -1.728515625, -1.521240234375, -1.31396484375, -1.106689453125, -0.8994140625, -0.692138671875, -0.48486328125, -0.277587890625, -0.0703125, 0.136962890625, 0.34423828125, 0.551513671875, 0.7587890625, 0.966064453125, 1.17333984375, 1.380615234375, 1.587890625, 1.795166015625, 2.00244140625, 2.209716796875, 2.4169921875, 2.624267578125, 2.83154296875, 3.038818359375, 3.24609375, 3.453369140625, 3.66064453125, 3.867919921875, 4.0751953125, 4.282470703125, 4.48974609375, 4.697021484375, 4.904296875, 5.111572265625, 5.31884765625, 5.526123046875, 5.7333984375, 5.940673828125, 6.14794921875, 6.355224609375, 6.5625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 4.0, 8.0, 5.0, 6.0, 15.0, 11.0, 13.0, 14.0, 27.0, 27.0, 29.0, 33.0, 36.0, 38.0, 30.0, 44.0, 39.0, 51.0, 46.0, 52.0, 42.0, 46.0, 44.0, 42.0, 45.0, 31.0, 28.0, 32.0, 19.0, 25.0, 23.0, 16.0, 19.0, 15.0, 9.0, 10.0, 6.0, 9.0, 2.0, 7.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9873046875, -1.9159088134765625, -1.844512939453125, -1.7731170654296875, -1.70172119140625, -1.6303253173828125, -1.558929443359375, -1.4875335693359375, -1.4161376953125, -1.3447418212890625, -1.273345947265625, -1.2019500732421875, -1.13055419921875, -1.0591583251953125, -0.987762451171875, -0.9163665771484375, -0.844970703125, -0.7735748291015625, -0.702178955078125, -0.6307830810546875, -0.55938720703125, -0.4879913330078125, -0.416595458984375, -0.3451995849609375, -0.2738037109375, -0.2024078369140625, -0.131011962890625, -0.0596160888671875, 0.01177978515625, 0.0831756591796875, 0.154571533203125, 0.2259674072265625, 0.29736328125, 0.3687591552734375, 0.440155029296875, 0.5115509033203125, 0.58294677734375, 0.6543426513671875, 0.725738525390625, 0.7971343994140625, 0.8685302734375, 0.9399261474609375, 1.011322021484375, 1.0827178955078125, 1.15411376953125, 1.2255096435546875, 1.296905517578125, 1.3683013916015625, 1.439697265625, 1.5110931396484375, 1.582489013671875, 1.6538848876953125, 1.72528076171875, 1.7966766357421875, 1.868072509765625, 1.9394683837890625, 2.0108642578125, 2.0822601318359375, 2.153656005859375, 2.2250518798828125, 2.29644775390625, 2.3678436279296875, 2.439239501953125, 2.5106353759765625, 2.58203125]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 0.0, 0.0, 4.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 12.0, 6.0, 13.0, 15.0, 17.0, 19.0, 42.0, 42.0, 68.0, 93.0, 188.0, 279.0, 425.0, 901.0, 1808.0, 4125.0, 11360.0, 41583.0, 231141.0, 605608.0, 112937.0, 24311.0, 7634.0, 2841.0, 1334.0, 692.0, 386.0, 215.0, 129.0, 90.0, 68.0, 44.0, 26.0, 28.0, 14.0, 12.0, 10.0, 7.0, 5.0, 4.0, 4.0, 1.0, 3.0, 3.0, 0.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52978515625, -0.5128631591796875, -0.495941162109375, -0.4790191650390625, -0.46209716796875, -0.4451751708984375, -0.428253173828125, -0.4113311767578125, -0.3944091796875, -0.3774871826171875, -0.360565185546875, -0.3436431884765625, -0.32672119140625, -0.3097991943359375, -0.292877197265625, -0.2759552001953125, -0.259033203125, -0.2421112060546875, -0.225189208984375, -0.2082672119140625, -0.19134521484375, -0.1744232177734375, -0.157501220703125, -0.1405792236328125, -0.1236572265625, -0.1067352294921875, -0.089813232421875, -0.0728912353515625, -0.05596923828125, -0.0390472412109375, -0.022125244140625, -0.0052032470703125, 0.01171875, 0.0286407470703125, 0.045562744140625, 0.0624847412109375, 0.07940673828125, 0.0963287353515625, 0.113250732421875, 0.1301727294921875, 0.1470947265625, 0.1640167236328125, 0.180938720703125, 0.1978607177734375, 0.21478271484375, 0.2317047119140625, 0.248626708984375, 0.2655487060546875, 0.282470703125, 0.2993927001953125, 0.316314697265625, 0.3332366943359375, 0.35015869140625, 0.3670806884765625, 0.384002685546875, 0.4009246826171875, 0.4178466796875, 0.4347686767578125, 0.451690673828125, 0.4686126708984375, 0.48553466796875, 0.5024566650390625, 0.519378662109375, 0.5363006591796875, 0.55322265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 4.0, 10.0, 7.0, 15.0, 16.0, 23.0, 19.0, 23.0, 31.0, 36.0, 70.0, 80.0, 95.0, 114.0, 86.0, 78.0, 54.0, 51.0, 39.0, 33.0, 23.0, 13.0, 19.0, 11.0, 10.0, 6.0, 7.0, 3.0, 5.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.375810623168945e-05, -9.087100625038147e-05, -8.798390626907349e-05, -8.50968062877655e-05, -8.220970630645752e-05, -7.932260632514954e-05, -7.643550634384155e-05, -7.354840636253357e-05, -7.066130638122559e-05, -6.77742063999176e-05, -6.488710641860962e-05, -6.200000643730164e-05, -5.911290645599365e-05, -5.622580647468567e-05, -5.3338706493377686e-05, -5.04516065120697e-05, -4.756450653076172e-05, -4.4677406549453735e-05, -4.179030656814575e-05, -3.890320658683777e-05, -3.6016106605529785e-05, -3.31290066242218e-05, -3.024190664291382e-05, -2.7354806661605835e-05, -2.446770668029785e-05, -2.1580606698989868e-05, -1.8693506717681885e-05, -1.58064067363739e-05, -1.2919306755065918e-05, -1.0032206773757935e-05, -7.145106792449951e-06, -4.258006811141968e-06, -1.3709068298339844e-06, 1.516193151473999e-06, 4.403293132781982e-06, 7.290393114089966e-06, 1.017749309539795e-05, 1.3064593076705933e-05, 1.5951693058013916e-05, 1.88387930393219e-05, 2.1725893020629883e-05, 2.4612993001937866e-05, 2.750009298324585e-05, 3.0387192964553833e-05, 3.3274292945861816e-05, 3.61613929271698e-05, 3.904849290847778e-05, 4.1935592889785767e-05, 4.482269287109375e-05, 4.7709792852401733e-05, 5.059689283370972e-05, 5.34839928150177e-05, 5.6371092796325684e-05, 5.925819277763367e-05, 6.214529275894165e-05, 6.503239274024963e-05, 6.791949272155762e-05, 7.08065927028656e-05, 7.369369268417358e-05, 7.658079266548157e-05, 7.946789264678955e-05, 8.235499262809753e-05, 8.524209260940552e-05, 8.81291925907135e-05, 9.101629257202148e-05]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 6.0, 13.0, 11.0, 10.0, 14.0, 30.0, 40.0, 39.0, 61.0, 102.0, 146.0, 279.0, 391.0, 650.0, 1261.0, 2191.0, 4395.0, 9379.0, 23871.0, 77056.0, 341617.0, 438687.0, 97748.0, 28697.0, 11291.0, 4881.0, 2427.0, 1320.0, 709.0, 405.0, 260.0, 181.0, 120.0, 75.0, 58.0, 49.0, 28.0, 20.0, 11.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.380615234375, -0.3670654296875, -0.353515625, -0.3399658203125, -0.326416015625, -0.3128662109375, -0.29931640625, -0.2857666015625, -0.272216796875, -0.2586669921875, -0.2451171875, -0.2315673828125, -0.218017578125, -0.2044677734375, -0.19091796875, -0.1773681640625, -0.163818359375, -0.1502685546875, -0.13671875, -0.1231689453125, -0.109619140625, -0.0960693359375, -0.08251953125, -0.0689697265625, -0.055419921875, -0.0418701171875, -0.0283203125, -0.0147705078125, -0.001220703125, 0.0123291015625, 0.02587890625, 0.0394287109375, 0.052978515625, 0.0665283203125, 0.080078125, 0.0936279296875, 0.107177734375, 0.1207275390625, 0.13427734375, 0.1478271484375, 0.161376953125, 0.1749267578125, 0.1884765625, 0.2020263671875, 0.215576171875, 0.2291259765625, 0.24267578125, 0.2562255859375, 0.269775390625, 0.2833251953125, 0.296875, 0.3104248046875, 0.323974609375, 0.3375244140625, 0.35107421875, 0.3646240234375, 0.378173828125, 0.3917236328125, 0.4052734375, 0.4188232421875, 0.432373046875, 0.4459228515625, 0.45947265625, 0.4730224609375, 0.486572265625]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 11.0, 5.0, 13.0, 11.0, 15.0, 12.0, 19.0, 35.0, 26.0, 46.0, 42.0, 57.0, 63.0, 89.0, 88.0, 73.0, 77.0, 61.0, 60.0, 42.0, 27.0, 37.0, 14.0, 13.0, 17.0, 8.0, 7.0, 10.0, 6.0, 4.0, 0.0, 4.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2193603515625, -0.21265602111816406, -0.20595169067382812, -0.1992473602294922, -0.19254302978515625, -0.1858386993408203, -0.17913436889648438, -0.17243003845214844, -0.1657257080078125, -0.15902137756347656, -0.15231704711914062, -0.1456127166748047, -0.13890838623046875, -0.1322040557861328, -0.12549972534179688, -0.11879539489746094, -0.112091064453125, -0.10538673400878906, -0.09868240356445312, -0.09197807312011719, -0.08527374267578125, -0.07856941223144531, -0.07186508178710938, -0.06516075134277344, -0.0584564208984375, -0.05175209045410156, -0.045047760009765625, -0.03834342956542969, -0.03163909912109375, -0.024934768676757812, -0.018230438232421875, -0.011526107788085938, -0.00482177734375, 0.0018825531005859375, 0.008586883544921875, 0.015291213989257812, 0.02199554443359375, 0.028699874877929688, 0.035404205322265625, 0.04210853576660156, 0.0488128662109375, 0.05551719665527344, 0.062221527099609375, 0.06892585754394531, 0.07563018798828125, 0.08233451843261719, 0.08903884887695312, 0.09574317932128906, 0.102447509765625, 0.10915184020996094, 0.11585617065429688, 0.12256050109863281, 0.12926483154296875, 0.1359691619873047, 0.14267349243164062, 0.14937782287597656, 0.1560821533203125, 0.16278648376464844, 0.16949081420898438, 0.1761951446533203, 0.18289947509765625, 0.1896038055419922, 0.19630813598632812, 0.20301246643066406, 0.209716796875]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 19.0, 29.0, 120.0, 272.0, 344.0, 122.0, 38.0, 21.0, 17.0, 7.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.135523319244385, -4.795766353607178, -4.4560089111328125, -4.1162519454956055, -3.7764949798583984, -3.4367377758026123, -3.096980571746826, -2.757223606109619, -2.417466402053833, -2.077709197998047, -1.7379522323608398, -1.3981950283050537, -1.0584379434585571, -0.7186808586120605, -0.3789236545562744, -0.03916668891906738, 0.30059051513671875, 0.6403475999832153, 0.9801047444343567, 1.319861888885498, 1.6596189737319946, 1.9993760585784912, 2.3391332626342773, 2.6788902282714844, 3.0186474323272705, 3.3584046363830566, 3.6981616020202637, 4.037919044494629, 4.377676010131836, 4.717432975769043, 5.05718994140625, 5.396946907043457, 5.7367048263549805, 6.0764617919921875, 6.416219234466553, 6.75597620010376, 7.095733165740967, 7.435490608215332, 7.775247573852539, 8.115004539489746, 8.454761505126953, 8.79451847076416, 9.134275436401367, 9.47403335571289, 9.813790321350098, 10.153547286987305, 10.493304252624512, 10.833061218261719, 11.172819137573242, 11.51257610321045, 11.852333068847656, 12.19209098815918, 12.531847953796387, 12.871604919433594, 13.2113618850708, 13.551118850708008, 13.890875816345215, 14.230632781982422, 14.570389747619629, 14.910146713256836, 15.24990463256836, 15.589661598205566, 15.929418563842773, 16.269176483154297, 16.608932495117188]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 7.0, 3.0, 9.0, 12.0, 10.0, 20.0, 14.0, 20.0, 19.0, 27.0, 32.0, 25.0, 27.0, 40.0, 51.0, 50.0, 45.0, 38.0, 41.0, 50.0, 51.0, 36.0, 39.0, 30.0, 30.0, 35.0, 37.0, 32.0, 23.0, 27.0, 19.0, 23.0, 13.0, 10.0, 13.0, 5.0, 10.0, 4.0, 8.0, 2.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0], "bins": [-3.8744328022003174, -3.752547264099121, -3.630661964416504, -3.5087764263153076, -3.3868908882141113, -3.265005588531494, -3.143120050430298, -3.0212345123291016, -2.8993492126464844, -2.777463674545288, -2.655578374862671, -2.5336928367614746, -2.4118072986602783, -2.289921760559082, -2.168036460876465, -2.0461509227752686, -1.9242653846740723, -1.8023799657821655, -1.6804944276809692, -1.5586090087890625, -1.4367234706878662, -1.3148380517959595, -1.1929526329040527, -1.0710670948028564, -0.9491816759109497, -0.8272961974143982, -0.7054107189178467, -0.5835253000259399, -0.4616398215293884, -0.3397543430328369, -0.21786892414093018, -0.09598344564437866, 0.02590203285217285, 0.14778749644756317, 0.2696729600429535, 0.3915584087371826, 0.5134438872337341, 0.6353293657302856, 0.7572147846221924, 0.8791002631187439, 1.0009857416152954, 1.1228711605072021, 1.2447566986083984, 1.3666421175003052, 1.488527536392212, 1.6104130744934082, 1.732298493385315, 1.8541839122772217, 1.976069450378418, 2.0979549884796143, 2.2198402881622314, 2.3417258262634277, 2.463611364364624, 2.5854969024658203, 2.7073822021484375, 2.829267740249634, 2.95115327835083, 3.0730388164520264, 3.1949241161346436, 3.31680965423584, 3.438695192337036, 3.5605807304382324, 3.6824660301208496, 3.804351568222046, 3.926236867904663]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 15.0, 12.0, 22.0, 32.0, 34.0, 65.0, 75.0, 154.0, 208.0, 367.0, 685.0, 1336.0, 2770.0, 7011.0, 21827.0, 102292.0, 1752568.0, 2156839.0, 110894.0, 23587.0, 7548.0, 2921.0, 1367.0, 711.0, 359.0, 202.0, 128.0, 83.0, 68.0, 30.0, 18.0, 16.0, 9.0, 6.0, 12.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.91015625, -1.84197998046875, -1.7738037109375, -1.70562744140625, -1.637451171875, -1.56927490234375, -1.5010986328125, -1.43292236328125, -1.36474609375, -1.29656982421875, -1.2283935546875, -1.16021728515625, -1.092041015625, -1.02386474609375, -0.9556884765625, -0.88751220703125, -0.8193359375, -0.75115966796875, -0.6829833984375, -0.61480712890625, -0.546630859375, -0.47845458984375, -0.4102783203125, -0.34210205078125, -0.27392578125, -0.20574951171875, -0.1375732421875, -0.06939697265625, -0.001220703125, 0.06695556640625, 0.1351318359375, 0.20330810546875, 0.271484375, 0.33966064453125, 0.4078369140625, 0.47601318359375, 0.544189453125, 0.61236572265625, 0.6805419921875, 0.74871826171875, 0.81689453125, 0.88507080078125, 0.9532470703125, 1.02142333984375, 1.089599609375, 1.15777587890625, 1.2259521484375, 1.29412841796875, 1.3623046875, 1.43048095703125, 1.4986572265625, 1.56683349609375, 1.635009765625, 1.70318603515625, 1.7713623046875, 1.83953857421875, 1.90771484375, 1.97589111328125, 2.0440673828125, 2.11224365234375, 2.180419921875, 2.24859619140625, 2.3167724609375, 2.38494873046875, 2.453125]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 2.0, 5.0, 2.0, 5.0, 5.0, 10.0, 11.0, 9.0, 11.0, 21.0, 22.0, 33.0, 45.0, 40.0, 58.0, 53.0, 60.0, 63.0, 66.0, 55.0, 66.0, 56.0, 54.0, 52.0, 40.0, 32.0, 29.0, 15.0, 22.0, 15.0, 10.0, 8.0, 9.0, 5.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6416015625, -1.5928955078125, -1.544189453125, -1.4954833984375, -1.44677734375, -1.3980712890625, -1.349365234375, -1.3006591796875, -1.251953125, -1.2032470703125, -1.154541015625, -1.1058349609375, -1.05712890625, -1.0084228515625, -0.959716796875, -0.9110107421875, -0.8623046875, -0.8135986328125, -0.764892578125, -0.7161865234375, -0.66748046875, -0.6187744140625, -0.570068359375, -0.5213623046875, -0.47265625, -0.4239501953125, -0.375244140625, -0.3265380859375, -0.27783203125, -0.2291259765625, -0.180419921875, -0.1317138671875, -0.0830078125, -0.0343017578125, 0.014404296875, 0.0631103515625, 0.11181640625, 0.1605224609375, 0.209228515625, 0.2579345703125, 0.306640625, 0.3553466796875, 0.404052734375, 0.4527587890625, 0.50146484375, 0.5501708984375, 0.598876953125, 0.6475830078125, 0.6962890625, 0.7449951171875, 0.793701171875, 0.8424072265625, 0.89111328125, 0.9398193359375, 0.988525390625, 1.0372314453125, 1.0859375, 1.1346435546875, 1.183349609375, 1.2320556640625, 1.28076171875, 1.3294677734375, 1.378173828125, 1.4268798828125, 1.4755859375]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 7.0, 11.0, 14.0, 34.0, 51.0, 117.0, 247.0, 1038.0, 20761.0, 4145054.0, 25223.0, 1211.0, 271.0, 109.0, 57.0, 30.0, 13.0, 9.0, 5.0, 2.0, 2.0, 8.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.34375, -9.03759765625, -8.7314453125, -8.42529296875, -8.119140625, -7.81298828125, -7.5068359375, -7.20068359375, -6.89453125, -6.58837890625, -6.2822265625, -5.97607421875, -5.669921875, -5.36376953125, -5.0576171875, -4.75146484375, -4.4453125, -4.13916015625, -3.8330078125, -3.52685546875, -3.220703125, -2.91455078125, -2.6083984375, -2.30224609375, -1.99609375, -1.68994140625, -1.3837890625, -1.07763671875, -0.771484375, -0.46533203125, -0.1591796875, 0.14697265625, 0.453125, 0.75927734375, 1.0654296875, 1.37158203125, 1.677734375, 1.98388671875, 2.2900390625, 2.59619140625, 2.90234375, 3.20849609375, 3.5146484375, 3.82080078125, 4.126953125, 4.43310546875, 4.7392578125, 5.04541015625, 5.3515625, 5.65771484375, 5.9638671875, 6.27001953125, 6.576171875, 6.88232421875, 7.1884765625, 7.49462890625, 7.80078125, 8.10693359375, 8.4130859375, 8.71923828125, 9.025390625, 9.33154296875, 9.6376953125, 9.94384765625, 10.25]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 0.0, 6.0, 6.0, 7.0, 5.0, 12.0, 13.0, 15.0, 22.0, 25.0, 34.0, 55.0, 62.0, 68.0, 125.0, 213.0, 368.0, 817.0, 982.0, 448.0, 233.0, 140.0, 101.0, 77.0, 53.0, 47.0, 28.0, 26.0, 25.0, 15.0, 8.0, 10.0, 9.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.525390625, -0.5090408325195312, -0.4926910400390625, -0.47634124755859375, -0.459991455078125, -0.44364166259765625, -0.4272918701171875, -0.41094207763671875, -0.39459228515625, -0.37824249267578125, -0.3618927001953125, -0.34554290771484375, -0.329193115234375, -0.31284332275390625, -0.2964935302734375, -0.28014373779296875, -0.2637939453125, -0.24744415283203125, -0.2310943603515625, -0.21474456787109375, -0.198394775390625, -0.18204498291015625, -0.1656951904296875, -0.14934539794921875, -0.13299560546875, -0.11664581298828125, -0.1002960205078125, -0.08394622802734375, -0.067596435546875, -0.05124664306640625, -0.0348968505859375, -0.01854705810546875, -0.002197265625, 0.01415252685546875, 0.0305023193359375, 0.04685211181640625, 0.063201904296875, 0.07955169677734375, 0.0959014892578125, 0.11225128173828125, 0.12860107421875, 0.14495086669921875, 0.1613006591796875, 0.17765045166015625, 0.194000244140625, 0.21035003662109375, 0.2266998291015625, 0.24304962158203125, 0.2593994140625, 0.27574920654296875, 0.2920989990234375, 0.30844879150390625, 0.324798583984375, 0.34114837646484375, 0.3574981689453125, 0.37384796142578125, 0.39019775390625, 0.40654754638671875, 0.4228973388671875, 0.43924713134765625, 0.455596923828125, 0.47194671630859375, 0.4882965087890625, 0.5046463012695312, 0.52099609375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 5.0, 12.0, 13.0, 27.0, 47.0, 81.0, 168.0, 191.0, 166.0, 119.0, 64.0, 37.0, 21.0, 13.0, 5.0, 5.0, 3.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.697857856750488, -4.566412448883057, -4.434967041015625, -4.303522109985352, -4.17207670211792, -4.040631294250488, -3.9091858863830566, -3.777740478515625, -3.6462950706481934, -3.5148496627807617, -3.383404493331909, -3.2519590854644775, -3.120513677597046, -2.9890685081481934, -2.8576231002807617, -2.72617769241333, -2.5947325229644775, -2.463287115097046, -2.3318419456481934, -2.2003965377807617, -2.06895112991333, -1.937505841255188, -1.806060552597046, -1.6746151447296143, -1.5431698560714722, -1.41172456741333, -1.2802791595458984, -1.1488338708877563, -1.0173885822296143, -0.8859431743621826, -0.7544978857040405, -0.6230525374412537, -0.4916071891784668, -0.36016184091567993, -0.22871652245521545, -0.09727120399475098, 0.03417414426803589, 0.16561949253082275, 0.29706478118896484, 0.4285101294517517, 0.5599554777145386, 0.6914008259773254, 0.8228461742401123, 0.9542914628982544, 1.0857367515563965, 1.2171821594238281, 1.3486274480819702, 1.4800727367401123, 1.611518144607544, 1.742963433265686, 1.8744088411331177, 2.0058541297912598, 2.1372995376586914, 2.268744945526123, 2.4001901149749756, 2.5316355228424072, 2.6630806922912598, 2.7945261001586914, 2.925971269607544, 3.0574166774749756, 3.1888620853424072, 3.3203072547912598, 3.4517526626586914, 3.583198070526123, 3.7146434783935547]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 4.0, 8.0, 12.0, 10.0, 11.0, 13.0, 20.0, 14.0, 24.0, 31.0, 38.0, 50.0, 51.0, 57.0, 63.0, 52.0, 69.0, 56.0, 48.0, 60.0, 46.0, 51.0, 34.0, 35.0, 29.0, 31.0, 16.0, 17.0, 12.0, 9.0, 8.0, 5.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5557526350021362, -1.5006544589996338, -1.4455562829971313, -1.390458106994629, -1.3353599309921265, -1.280261754989624, -1.225163459777832, -1.1700654029846191, -1.1149671077728271, -1.0598689317703247, -1.0047707557678223, -0.9496725797653198, -0.8945744037628174, -0.8394762277603149, -0.7843779921531677, -0.7292798161506653, -0.6741816997528076, -0.6190835237503052, -0.5639853477478027, -0.5088871717453003, -0.45378896594047546, -0.398690789937973, -0.3435925841331482, -0.28849440813064575, -0.2333962321281433, -0.17829805612564087, -0.12319986522197723, -0.0681016743183136, -0.013003498315811157, 0.042094677686691284, 0.09719288349151611, 0.15229105949401855, 0.207389235496521, 0.26248741149902344, 0.3175855875015259, 0.3726837933063507, 0.42778196930885315, 0.4828801453113556, 0.5379783511161804, 0.5930765271186829, 0.6481747031211853, 0.7032728791236877, 0.7583710551261902, 0.8134692907333374, 0.8685674667358398, 0.9236656427383423, 0.9787638187408447, 1.0338619947433472, 1.0889601707458496, 1.144058346748352, 1.1991565227508545, 1.254254698753357, 1.3093528747558594, 1.3644510507583618, 1.4195492267608643, 1.4746475219726562, 1.5297455787658691, 1.5848437547683716, 1.639941930770874, 1.6950401067733765, 1.750138282775879, 1.8052364587783813, 1.8603346347808838, 1.9154329299926758, 1.9705311059951782]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 13.0, 6.0, 19.0, 17.0, 36.0, 51.0, 64.0, 103.0, 148.0, 253.0, 476.0, 924.0, 2024.0, 5350.0, 17526.0, 85339.0, 616640.0, 265823.0, 37735.0, 9576.0, 3405.0, 1433.0, 690.0, 363.0, 189.0, 109.0, 62.0, 44.0, 33.0, 24.0, 18.0, 25.0, 10.0, 3.0, 4.0, 2.0, 6.0, 6.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1854248046875, -0.1797657012939453, -0.17410659790039062, -0.16844749450683594, -0.16278839111328125, -0.15712928771972656, -0.15147018432617188, -0.1458110809326172, -0.1401519775390625, -0.1344928741455078, -0.12883377075195312, -0.12317466735839844, -0.11751556396484375, -0.11185646057128906, -0.10619735717773438, -0.10053825378417969, -0.094879150390625, -0.08922004699707031, -0.08356094360351562, -0.07790184020996094, -0.07224273681640625, -0.06658363342285156, -0.060924530029296875, -0.05526542663574219, -0.0496063232421875, -0.04394721984863281, -0.038288116455078125, -0.03262901306152344, -0.02696990966796875, -0.021310806274414062, -0.015651702880859375, -0.009992599487304688, -0.00433349609375, 0.0013256072998046875, 0.006984710693359375, 0.012643814086914062, 0.01830291748046875, 0.023962020874023438, 0.029621124267578125, 0.03528022766113281, 0.0409393310546875, 0.04659843444824219, 0.052257537841796875, 0.05791664123535156, 0.06357574462890625, 0.06923484802246094, 0.07489395141601562, 0.08055305480957031, 0.086212158203125, 0.09187126159667969, 0.09753036499023438, 0.10318946838378906, 0.10884857177734375, 0.11450767517089844, 0.12016677856445312, 0.1258258819580078, 0.1314849853515625, 0.1371440887451172, 0.14280319213867188, 0.14846229553222656, 0.15412139892578125, 0.15978050231933594, 0.16543960571289062, 0.1710987091064453, 0.1767578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 7.0, 5.0, 5.0, 7.0, 13.0, 8.0, 12.0, 14.0, 22.0, 29.0, 49.0, 62.0, 50.0, 72.0, 68.0, 75.0, 68.0, 68.0, 70.0, 59.0, 53.0, 31.0, 41.0, 23.0, 20.0, 17.0, 11.0, 15.0, 9.0, 3.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.380859375, -1.336395263671875, -1.29193115234375, -1.247467041015625, -1.2030029296875, -1.158538818359375, -1.11407470703125, -1.069610595703125, -1.025146484375, -0.980682373046875, -0.93621826171875, -0.891754150390625, -0.8472900390625, -0.802825927734375, -0.75836181640625, -0.713897705078125, -0.66943359375, -0.624969482421875, -0.58050537109375, -0.536041259765625, -0.4915771484375, -0.447113037109375, -0.40264892578125, -0.358184814453125, -0.313720703125, -0.269256591796875, -0.22479248046875, -0.180328369140625, -0.1358642578125, -0.091400146484375, -0.04693603515625, -0.002471923828125, 0.0419921875, 0.086456298828125, 0.13092041015625, 0.175384521484375, 0.2198486328125, 0.264312744140625, 0.30877685546875, 0.353240966796875, 0.397705078125, 0.442169189453125, 0.48663330078125, 0.531097412109375, 0.5755615234375, 0.620025634765625, 0.66448974609375, 0.708953857421875, 0.75341796875, 0.797882080078125, 0.84234619140625, 0.886810302734375, 0.9312744140625, 0.975738525390625, 1.02020263671875, 1.064666748046875, 1.109130859375, 1.153594970703125, 1.19805908203125, 1.242523193359375, 1.2869873046875, 1.331451416015625, 1.37591552734375, 1.420379638671875, 1.46484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 10.0, 14.0, 14.0, 18.0, 32.0, 33.0, 47.0, 50.0, 80.0, 99.0, 158.0, 202.0, 304.0, 567.0, 1477.0, 9798.0, 138877.0, 789412.0, 96860.0, 7628.0, 1386.0, 462.0, 293.0, 167.0, 150.0, 117.0, 68.0, 59.0, 43.0, 30.0, 18.0, 20.0, 12.0, 8.0, 7.0, 14.0, 6.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2099609375, -0.20403671264648438, -0.19811248779296875, -0.19218826293945312, -0.1862640380859375, -0.18033981323242188, -0.17441558837890625, -0.16849136352539062, -0.162567138671875, -0.15664291381835938, -0.15071868896484375, -0.14479446411132812, -0.1388702392578125, -0.13294601440429688, -0.12702178955078125, -0.12109756469726562, -0.11517333984375, -0.10924911499023438, -0.10332489013671875, -0.09740066528320312, -0.0914764404296875, -0.08555221557617188, -0.07962799072265625, -0.07370376586914062, -0.067779541015625, -0.061855316162109375, -0.05593109130859375, -0.050006866455078125, -0.0440826416015625, -0.038158416748046875, -0.03223419189453125, -0.026309967041015625, -0.0203857421875, -0.014461517333984375, -0.00853729248046875, -0.002613067626953125, 0.0033111572265625, 0.009235382080078125, 0.01515960693359375, 0.021083831787109375, 0.027008056640625, 0.032932281494140625, 0.03885650634765625, 0.044780731201171875, 0.0507049560546875, 0.056629180908203125, 0.06255340576171875, 0.06847763061523438, 0.07440185546875, 0.08032608032226562, 0.08625030517578125, 0.09217453002929688, 0.0980987548828125, 0.10402297973632812, 0.10994720458984375, 0.11587142944335938, 0.121795654296875, 0.12771987915039062, 0.13364410400390625, 0.13956832885742188, 0.1454925537109375, 0.15141677856445312, 0.15734100341796875, 0.16326522827148438, 0.169189453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 8.0, 6.0, 6.0, 10.0, 12.0, 12.0, 24.0, 18.0, 25.0, 25.0, 39.0, 40.0, 53.0, 38.0, 50.0, 56.0, 42.0, 56.0, 64.0, 54.0, 44.0, 51.0, 33.0, 35.0, 34.0, 23.0, 33.0, 22.0, 20.0, 14.0, 7.0, 15.0, 7.0, 6.0, 3.0, 5.0, 5.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-2.2265625, -2.164337158203125, -2.10211181640625, -2.039886474609375, -1.9776611328125, -1.915435791015625, -1.85321044921875, -1.790985107421875, -1.728759765625, -1.666534423828125, -1.60430908203125, -1.542083740234375, -1.4798583984375, -1.417633056640625, -1.35540771484375, -1.293182373046875, -1.23095703125, -1.168731689453125, -1.10650634765625, -1.044281005859375, -0.9820556640625, -0.919830322265625, -0.85760498046875, -0.795379638671875, -0.733154296875, -0.670928955078125, -0.60870361328125, -0.546478271484375, -0.4842529296875, -0.422027587890625, -0.35980224609375, -0.297576904296875, -0.2353515625, -0.173126220703125, -0.11090087890625, -0.048675537109375, 0.0135498046875, 0.075775146484375, 0.13800048828125, 0.200225830078125, 0.262451171875, 0.324676513671875, 0.38690185546875, 0.449127197265625, 0.5113525390625, 0.573577880859375, 0.63580322265625, 0.698028564453125, 0.76025390625, 0.822479248046875, 0.88470458984375, 0.946929931640625, 1.0091552734375, 1.071380615234375, 1.13360595703125, 1.195831298828125, 1.258056640625, 1.320281982421875, 1.38250732421875, 1.444732666015625, 1.5069580078125, 1.569183349609375, 1.63140869140625, 1.693634033203125, 1.755859375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 9.0, 7.0, 9.0, 16.0, 17.0, 20.0, 32.0, 28.0, 51.0, 39.0, 92.0, 134.0, 248.0, 776.0, 5497.0, 973658.0, 64704.0, 2154.0, 438.0, 206.0, 104.0, 85.0, 63.0, 44.0, 34.0, 28.0, 17.0, 18.0, 5.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.12042236328125, -0.11715030670166016, -0.11387825012207031, -0.11060619354248047, -0.10733413696289062, -0.10406208038330078, -0.10079002380371094, -0.0975179672241211, -0.09424591064453125, -0.0909738540649414, -0.08770179748535156, -0.08442974090576172, -0.08115768432617188, -0.07788562774658203, -0.07461357116699219, -0.07134151458740234, -0.0680694580078125, -0.06479740142822266, -0.06152534484863281, -0.05825328826904297, -0.054981231689453125, -0.05170917510986328, -0.04843711853027344, -0.045165061950683594, -0.04189300537109375, -0.038620948791503906, -0.03534889221191406, -0.03207683563232422, -0.028804779052734375, -0.02553272247314453, -0.022260665893554688, -0.018988609313964844, -0.015716552734375, -0.012444496154785156, -0.009172439575195312, -0.005900382995605469, -0.002628326416015625, 0.0006437301635742188, 0.0039157867431640625, 0.007187843322753906, 0.01045989990234375, 0.013731956481933594, 0.017004013061523438, 0.02027606964111328, 0.023548126220703125, 0.02682018280029297, 0.030092239379882812, 0.033364295959472656, 0.0366363525390625, 0.039908409118652344, 0.04318046569824219, 0.04645252227783203, 0.049724578857421875, 0.05299663543701172, 0.05626869201660156, 0.059540748596191406, 0.06281280517578125, 0.0660848617553711, 0.06935691833496094, 0.07262897491455078, 0.07590103149414062, 0.07917308807373047, 0.08244514465332031, 0.08571720123291016, 0.0889892578125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 6.0, 5.0, 13.0, 35.0, 77.0, 203.0, 344.0, 194.0, 75.0, 30.0, 10.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.123283386230469e-05, -2.908799797296524e-05, -2.6943162083625793e-05, -2.4798326194286346e-05, -2.26534903049469e-05, -2.0508654415607452e-05, -1.8363818526268005e-05, -1.621898263692856e-05, -1.4074146747589111e-05, -1.1929310858249664e-05, -9.784474968910217e-06, -7.63963907957077e-06, -5.494803190231323e-06, -3.3499673008918762e-06, -1.2051314115524292e-06, 9.397044777870178e-07, 3.084540367126465e-06, 5.229376256465912e-06, 7.374212145805359e-06, 9.519048035144806e-06, 1.1663883924484253e-05, 1.38087198138237e-05, 1.5953555703163147e-05, 1.8098391592502594e-05, 2.024322748184204e-05, 2.2388063371181488e-05, 2.4532899260520935e-05, 2.6677735149860382e-05, 2.882257103919983e-05, 3.0967406928539276e-05, 3.311224281787872e-05, 3.525707870721817e-05, 3.740191459655762e-05, 3.9546750485897064e-05, 4.169158637523651e-05, 4.383642226457596e-05, 4.5981258153915405e-05, 4.812609404325485e-05, 5.02709299325943e-05, 5.2415765821933746e-05, 5.456060171127319e-05, 5.670543760061264e-05, 5.885027348995209e-05, 6.0995109379291534e-05, 6.313994526863098e-05, 6.528478115797043e-05, 6.742961704730988e-05, 6.957445293664932e-05, 7.171928882598877e-05, 7.386412471532822e-05, 7.600896060466766e-05, 7.815379649400711e-05, 8.029863238334656e-05, 8.2443468272686e-05, 8.458830416202545e-05, 8.67331400513649e-05, 8.887797594070435e-05, 9.102281183004379e-05, 9.316764771938324e-05, 9.531248360872269e-05, 9.745731949806213e-05, 9.960215538740158e-05, 0.00010174699127674103, 0.00010389182716608047, 0.00010603666305541992]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 7.0, 6.0, 7.0, 8.0, 3.0, 10.0, 17.0, 10.0, 28.0, 35.0, 44.0, 68.0, 100.0, 175.0, 272.0, 546.0, 1065.0, 2635.0, 7985.0, 63648.0, 924861.0, 36584.0, 6410.0, 1990.0, 875.0, 437.0, 218.0, 177.0, 106.0, 60.0, 57.0, 33.0, 23.0, 21.0, 9.0, 10.0, 5.0, 2.0, 5.0, 2.0, 7.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07916259765625, -0.07647037506103516, -0.07377815246582031, -0.07108592987060547, -0.06839370727539062, -0.06570148468017578, -0.06300926208496094, -0.060317039489746094, -0.05762481689453125, -0.054932594299316406, -0.05224037170410156, -0.04954814910888672, -0.046855926513671875, -0.04416370391845703, -0.04147148132324219, -0.038779258728027344, -0.0360870361328125, -0.033394813537597656, -0.030702590942382812, -0.02801036834716797, -0.025318145751953125, -0.02262592315673828, -0.019933700561523438, -0.017241477966308594, -0.01454925537109375, -0.011857032775878906, -0.009164810180664062, -0.006472587585449219, -0.003780364990234375, -0.0010881423950195312, 0.0016040802001953125, 0.004296302795410156, 0.006988525390625, 0.009680747985839844, 0.012372970581054688, 0.015065193176269531, 0.017757415771484375, 0.02044963836669922, 0.023141860961914062, 0.025834083557128906, 0.02852630615234375, 0.031218528747558594, 0.03391075134277344, 0.03660297393798828, 0.039295196533203125, 0.04198741912841797, 0.04467964172363281, 0.047371864318847656, 0.0500640869140625, 0.052756309509277344, 0.05544853210449219, 0.05814075469970703, 0.060832977294921875, 0.06352519989013672, 0.06621742248535156, 0.0689096450805664, 0.07160186767578125, 0.0742940902709961, 0.07698631286621094, 0.07967853546142578, 0.08237075805664062, 0.08506298065185547, 0.08775520324707031, 0.09044742584228516, 0.0931396484375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 10.0, 9.0, 14.0, 21.0, 22.0, 33.0, 70.0, 173.0, 324.0, 132.0, 59.0, 44.0, 26.0, 18.0, 13.0, 5.0, 5.0, 8.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0171661376953125, -0.016760945320129395, -0.01635575294494629, -0.015950560569763184, -0.015545368194580078, -0.015140175819396973, -0.014734983444213867, -0.014329791069030762, -0.013924598693847656, -0.01351940631866455, -0.013114213943481445, -0.01270902156829834, -0.012303829193115234, -0.011898636817932129, -0.011493444442749023, -0.011088252067565918, -0.010683059692382812, -0.010277867317199707, -0.009872674942016602, -0.009467482566833496, -0.00906229019165039, -0.008657097816467285, -0.00825190544128418, -0.007846713066101074, -0.007441520690917969, -0.007036328315734863, -0.006631135940551758, -0.006225943565368652, -0.005820751190185547, -0.005415558815002441, -0.005010366439819336, -0.0046051740646362305, -0.004199981689453125, -0.0037947893142700195, -0.003389596939086914, -0.0029844045639038086, -0.002579212188720703, -0.0021740198135375977, -0.0017688274383544922, -0.0013636350631713867, -0.0009584426879882812, -0.0005532503128051758, -0.0001480579376220703, 0.00025713443756103516, 0.0006623268127441406, 0.001067519187927246, 0.0014727115631103516, 0.001877903938293457, 0.0022830963134765625, 0.002688288688659668, 0.0030934810638427734, 0.003498673439025879, 0.0039038658142089844, 0.00430905818939209, 0.004714250564575195, 0.005119442939758301, 0.005524635314941406, 0.005929827690124512, 0.006335020065307617, 0.006740212440490723, 0.007145404815673828, 0.007550597190856934, 0.007955789566040039, 0.008360981941223145, 0.00876617431640625]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 6.0, 5.0, 16.0, 29.0, 54.0, 123.0, 244.0, 226.0, 151.0, 55.0, 36.0, 15.0, 12.0, 5.0, 8.0, 4.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.8232192993164062, -3.71435284614563, -3.6054863929748535, -3.496619939804077, -3.387753486633301, -3.2788872718811035, -3.170020818710327, -3.061154365539551, -2.9522879123687744, -2.843421459197998, -2.7345550060272217, -2.6256885528564453, -2.516822338104248, -2.4079556465148926, -2.2990894317626953, -2.190222978591919, -2.0813565254211426, -1.9724900722503662, -1.8636236190795898, -1.754757285118103, -1.6458908319473267, -1.5370243787765503, -1.4281580448150635, -1.319291591644287, -1.2104251384735107, -1.1015586853027344, -0.9926922917366028, -0.8838258981704712, -0.7749594449996948, -0.6660929918289185, -0.5572265982627869, -0.4483602046966553, -0.3394935131072998, -0.23062708973884583, -0.12176066637039185, -0.012894243001937866, 0.09597218036651611, 0.20483863353729248, 0.3137050271034241, 0.42257142066955566, 0.531437873840332, 0.6403043270111084, 0.74917072057724, 0.8580371141433716, 0.966903567314148, 1.0757700204849243, 1.1846363544464111, 1.2935028076171875, 1.4023692607879639, 1.5112357139587402, 1.6201021671295166, 1.7289685010910034, 1.8378349542617798, 1.9467014074325562, 2.055567741394043, 2.1644341945648193, 2.2733006477355957, 2.382167100906372, 2.4910335540771484, 2.599900007247925, 2.708766460418701, 2.8176326751708984, 2.926499128341675, 3.035365581512451, 3.1442320346832275]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 6.0, 12.0, 8.0, 11.0, 12.0, 18.0, 23.0, 30.0, 48.0, 58.0, 64.0, 79.0, 85.0, 80.0, 64.0, 83.0, 61.0, 51.0, 45.0, 41.0, 35.0, 14.0, 21.0, 16.0, 7.0, 5.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2564345598220825, -1.2110927104949951, -1.1657508611679077, -1.1204090118408203, -1.075067162513733, -1.0297253131866455, -0.9843835234642029, -0.9390417337417603, -0.8936998844146729, -0.8483580350875854, -0.803016185760498, -0.7576743364334106, -0.712332546710968, -0.6669906973838806, -0.6216488480567932, -0.5763070583343506, -0.5309651494026184, -0.485623300075531, -0.440281480550766, -0.3949396312236786, -0.3495978116989136, -0.30425596237182617, -0.25891411304473877, -0.21357229351997375, -0.16823044419288635, -0.12288860976696014, -0.07754676789045334, -0.03220492601394653, 0.013136908411979675, 0.058478742837905884, 0.10382059216499329, 0.1491624116897583, 0.1945042610168457, 0.2398460954427719, 0.2851879298686981, 0.3305297791957855, 0.37587159872055054, 0.42121344804763794, 0.46655529737472534, 0.511897087097168, 0.5572389364242554, 0.6025807857513428, 0.6479226350784302, 0.6932644844055176, 0.7386062741279602, 0.7839481234550476, 0.829289972782135, 0.8746317625045776, 0.9199736714363098, 0.9653155207633972, 1.0106573104858398, 1.0559991598129272, 1.1013410091400146, 1.146682858467102, 1.1920247077941895, 1.2373665571212769, 1.2827084064483643, 1.3280502557754517, 1.373392105102539, 1.4187339544296265, 1.4640758037567139, 1.5094175338745117, 1.5547595024108887, 1.6001012325286865, 1.645443081855774]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 4.0, 5.0, 8.0, 5.0, 4.0, 4.0, 8.0, 18.0, 36.0, 88.0, 287.0, 2050.0, 52535.0, 966615.0, 25169.0, 1320.0, 233.0, 78.0, 31.0, 16.0, 9.0, 8.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.51171875, -4.326904296875, -4.14208984375, -3.957275390625, -3.7724609375, -3.587646484375, -3.40283203125, -3.218017578125, -3.033203125, -2.848388671875, -2.66357421875, -2.478759765625, -2.2939453125, -2.109130859375, -1.92431640625, -1.739501953125, -1.5546875, -1.369873046875, -1.18505859375, -1.000244140625, -0.8154296875, -0.630615234375, -0.44580078125, -0.260986328125, -0.076171875, 0.108642578125, 0.29345703125, 0.478271484375, 0.6630859375, 0.847900390625, 1.03271484375, 1.217529296875, 1.40234375, 1.587158203125, 1.77197265625, 1.956787109375, 2.1416015625, 2.326416015625, 2.51123046875, 2.696044921875, 2.880859375, 3.065673828125, 3.25048828125, 3.435302734375, 3.6201171875, 3.804931640625, 3.98974609375, 4.174560546875, 4.359375, 4.544189453125, 4.72900390625, 4.913818359375, 5.0986328125, 5.283447265625, 5.46826171875, 5.653076171875, 5.837890625, 6.022705078125, 6.20751953125, 6.392333984375, 6.5771484375, 6.761962890625, 6.94677734375, 7.131591796875, 7.31640625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 11.0, 9.0, 7.0, 15.0, 16.0, 18.0, 33.0, 46.0, 37.0, 60.0, 65.0, 66.0, 69.0, 91.0, 75.0, 64.0, 58.0, 57.0, 39.0, 31.0, 23.0, 23.0, 20.0, 12.0, 11.0, 5.0, 3.0, 5.0, 4.0, 1.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.064453125, -2.969573974609375, -2.87469482421875, -2.779815673828125, -2.6849365234375, -2.590057373046875, -2.49517822265625, -2.400299072265625, -2.305419921875, -2.210540771484375, -2.11566162109375, -2.020782470703125, -1.9259033203125, -1.831024169921875, -1.73614501953125, -1.641265869140625, -1.54638671875, -1.451507568359375, -1.35662841796875, -1.261749267578125, -1.1668701171875, -1.071990966796875, -0.97711181640625, -0.882232666015625, -0.787353515625, -0.692474365234375, -0.59759521484375, -0.502716064453125, -0.4078369140625, -0.312957763671875, -0.21807861328125, -0.123199462890625, -0.0283203125, 0.066558837890625, 0.16143798828125, 0.256317138671875, 0.3511962890625, 0.446075439453125, 0.54095458984375, 0.635833740234375, 0.730712890625, 0.825592041015625, 0.92047119140625, 1.015350341796875, 1.1102294921875, 1.205108642578125, 1.29998779296875, 1.394866943359375, 1.48974609375, 1.584625244140625, 1.67950439453125, 1.774383544921875, 1.8692626953125, 1.964141845703125, 2.05902099609375, 2.153900146484375, 2.248779296875, 2.343658447265625, 2.43853759765625, 2.533416748046875, 2.6282958984375, 2.723175048828125, 2.81805419921875, 2.912933349609375, 3.0078125]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 7.0, 12.0, 14.0, 18.0, 24.0, 11.0, 20.0, 32.0, 31.0, 33.0, 45.0, 61.0, 83.0, 100.0, 143.0, 265.0, 865.0, 4561.0, 55435.0, 868115.0, 109736.0, 6794.0, 1137.0, 321.0, 154.0, 105.0, 78.0, 47.0, 59.0, 33.0, 49.0, 28.0, 17.0, 19.0, 17.0, 13.0, 9.0, 7.0, 7.0, 5.0, 7.0, 5.0, 6.0, 6.0, 4.0, 5.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.064453125, -2.970458984375, -2.87646484375, -2.782470703125, -2.6884765625, -2.594482421875, -2.50048828125, -2.406494140625, -2.3125, -2.218505859375, -2.12451171875, -2.030517578125, -1.9365234375, -1.842529296875, -1.74853515625, -1.654541015625, -1.560546875, -1.466552734375, -1.37255859375, -1.278564453125, -1.1845703125, -1.090576171875, -0.99658203125, -0.902587890625, -0.80859375, -0.714599609375, -0.62060546875, -0.526611328125, -0.4326171875, -0.338623046875, -0.24462890625, -0.150634765625, -0.056640625, 0.037353515625, 0.13134765625, 0.225341796875, 0.3193359375, 0.413330078125, 0.50732421875, 0.601318359375, 0.6953125, 0.789306640625, 0.88330078125, 0.977294921875, 1.0712890625, 1.165283203125, 1.25927734375, 1.353271484375, 1.447265625, 1.541259765625, 1.63525390625, 1.729248046875, 1.8232421875, 1.917236328125, 2.01123046875, 2.105224609375, 2.19921875, 2.293212890625, 2.38720703125, 2.481201171875, 2.5751953125, 2.669189453125, 2.76318359375, 2.857177734375, 2.951171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 5.0, 10.0, 10.0, 12.0, 11.0, 13.0, 14.0, 16.0, 19.0, 26.0, 29.0, 30.0, 27.0, 27.0, 33.0, 45.0, 32.0, 42.0, 34.0, 48.0, 34.0, 39.0, 45.0, 32.0, 40.0, 30.0, 35.0, 32.0, 24.0, 32.0, 25.0, 24.0, 15.0, 21.0, 13.0, 10.0, 8.0, 10.0, 4.0, 5.0, 5.0, 5.0, 6.0, 7.0, 3.0, 2.0, 1.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-2.3671875, -2.294708251953125, -2.22222900390625, -2.149749755859375, -2.0772705078125, -2.004791259765625, -1.93231201171875, -1.859832763671875, -1.787353515625, -1.714874267578125, -1.64239501953125, -1.569915771484375, -1.4974365234375, -1.424957275390625, -1.35247802734375, -1.279998779296875, -1.20751953125, -1.135040283203125, -1.06256103515625, -0.990081787109375, -0.9176025390625, -0.845123291015625, -0.77264404296875, -0.700164794921875, -0.627685546875, -0.555206298828125, -0.48272705078125, -0.410247802734375, -0.3377685546875, -0.265289306640625, -0.19281005859375, -0.120330810546875, -0.0478515625, 0.024627685546875, 0.09710693359375, 0.169586181640625, 0.2420654296875, 0.314544677734375, 0.38702392578125, 0.459503173828125, 0.531982421875, 0.604461669921875, 0.67694091796875, 0.749420166015625, 0.8218994140625, 0.894378662109375, 0.96685791015625, 1.039337158203125, 1.11181640625, 1.184295654296875, 1.25677490234375, 1.329254150390625, 1.4017333984375, 1.474212646484375, 1.54669189453125, 1.619171142578125, 1.691650390625, 1.764129638671875, 1.83660888671875, 1.909088134765625, 1.9815673828125, 2.054046630859375, 2.12652587890625, 2.199005126953125, 2.271484375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 3.0, 5.0, 10.0, 14.0, 17.0, 18.0, 44.0, 53.0, 90.0, 142.0, 212.0, 346.0, 617.0, 975.0, 2081.0, 4205.0, 10050.0, 28631.0, 110217.0, 504842.0, 292142.0, 61922.0, 18179.0, 6972.0, 3179.0, 1487.0, 811.0, 515.0, 267.0, 164.0, 130.0, 65.0, 43.0, 31.0, 19.0, 18.0, 8.0, 8.0, 9.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3876953125, -0.3742332458496094, -0.36077117919921875, -0.3473091125488281, -0.3338470458984375, -0.3203849792480469, -0.30692291259765625, -0.2934608459472656, -0.279998779296875, -0.2665367126464844, -0.25307464599609375, -0.23961257934570312, -0.2261505126953125, -0.21268844604492188, -0.19922637939453125, -0.18576431274414062, -0.17230224609375, -0.15884017944335938, -0.14537811279296875, -0.13191604614257812, -0.1184539794921875, -0.10499191284179688, -0.09152984619140625, -0.07806777954101562, -0.064605712890625, -0.051143646240234375, -0.03768157958984375, -0.024219512939453125, -0.0107574462890625, 0.002704620361328125, 0.01616668701171875, 0.029628753662109375, 0.0430908203125, 0.056552886962890625, 0.07001495361328125, 0.08347702026367188, 0.0969390869140625, 0.11040115356445312, 0.12386322021484375, 0.13732528686523438, 0.150787353515625, 0.16424942016601562, 0.17771148681640625, 0.19117355346679688, 0.2046356201171875, 0.21809768676757812, 0.23155975341796875, 0.24502182006835938, 0.25848388671875, 0.2719459533691406, 0.28540802001953125, 0.2988700866699219, 0.3123321533203125, 0.3257942199707031, 0.33925628662109375, 0.3527183532714844, 0.366180419921875, 0.3796424865722656, 0.39310455322265625, 0.4065666198730469, 0.4200286865234375, 0.4334907531738281, 0.44695281982421875, 0.4604148864746094, 0.473876953125]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 6.0, 14.0, 20.0, 33.0, 44.0, 54.0, 82.0, 96.0, 107.0, 116.0, 110.0, 105.0, 57.0, 41.0, 31.0, 24.0, 17.0, 8.0, 7.0, 5.0, 5.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.775161743164062e-05, -9.451806545257568e-05, -9.128451347351074e-05, -8.80509614944458e-05, -8.481740951538086e-05, -8.158385753631592e-05, -7.835030555725098e-05, -7.511675357818604e-05, -7.18832015991211e-05, -6.864964962005615e-05, -6.541609764099121e-05, -6.218254566192627e-05, -5.894899368286133e-05, -5.571544170379639e-05, -5.2481889724731445e-05, -4.9248337745666504e-05, -4.601478576660156e-05, -4.278123378753662e-05, -3.954768180847168e-05, -3.631412982940674e-05, -3.30805778503418e-05, -2.9847025871276855e-05, -2.6613473892211914e-05, -2.3379921913146973e-05, -2.014636993408203e-05, -1.691281795501709e-05, -1.3679265975952148e-05, -1.0445713996887207e-05, -7.212162017822266e-06, -3.978610038757324e-06, -7.450580596923828e-07, 2.4884939193725586e-06, 5.7220458984375e-06, 8.955597877502441e-06, 1.2189149856567383e-05, 1.5422701835632324e-05, 1.8656253814697266e-05, 2.1889805793762207e-05, 2.512335777282715e-05, 2.835690975189209e-05, 3.159046173095703e-05, 3.482401371002197e-05, 3.8057565689086914e-05, 4.1291117668151855e-05, 4.45246696472168e-05, 4.775822162628174e-05, 5.099177360534668e-05, 5.422532558441162e-05, 5.745887756347656e-05, 6.0692429542541504e-05, 6.392598152160645e-05, 6.715953350067139e-05, 7.039308547973633e-05, 7.362663745880127e-05, 7.686018943786621e-05, 8.009374141693115e-05, 8.33272933959961e-05, 8.656084537506104e-05, 8.979439735412598e-05, 9.302794933319092e-05, 9.626150131225586e-05, 9.94950532913208e-05, 0.00010272860527038574, 0.00010596215724945068, 0.00010919570922851562]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 4.0, 12.0, 14.0, 7.0, 19.0, 36.0, 36.0, 61.0, 75.0, 110.0, 186.0, 246.0, 474.0, 890.0, 1872.0, 4191.0, 11225.0, 39824.0, 224842.0, 606728.0, 118754.0, 24890.0, 7713.0, 3061.0, 1433.0, 751.0, 402.0, 236.0, 150.0, 91.0, 56.0, 34.0, 24.0, 24.0, 12.0, 11.0, 18.0, 10.0, 7.0, 7.0, 2.0, 1.0, 7.0, 1.0, 1.0, 0.0, 4.0], "bins": [-0.60302734375, -0.5864295959472656, -0.5698318481445312, -0.5532341003417969, -0.5366363525390625, -0.5200386047363281, -0.5034408569335938, -0.4868431091308594, -0.470245361328125, -0.4536476135253906, -0.43704986572265625, -0.4204521179199219, -0.4038543701171875, -0.3872566223144531, -0.37065887451171875, -0.3540611267089844, -0.33746337890625, -0.3208656311035156, -0.30426788330078125, -0.2876701354980469, -0.2710723876953125, -0.2544746398925781, -0.23787689208984375, -0.22127914428710938, -0.204681396484375, -0.18808364868164062, -0.17148590087890625, -0.15488815307617188, -0.1382904052734375, -0.12169265747070312, -0.10509490966796875, -0.08849716186523438, -0.0718994140625, -0.055301666259765625, -0.03870391845703125, -0.022106170654296875, -0.0055084228515625, 0.011089324951171875, 0.02768707275390625, 0.044284820556640625, 0.060882568359375, 0.07748031616210938, 0.09407806396484375, 0.11067581176757812, 0.1272735595703125, 0.14387130737304688, 0.16046905517578125, 0.17706680297851562, 0.19366455078125, 0.21026229858398438, 0.22686004638671875, 0.24345779418945312, 0.2600555419921875, 0.2766532897949219, 0.29325103759765625, 0.3098487854003906, 0.326446533203125, 0.3430442810058594, 0.35964202880859375, 0.3762397766113281, 0.3928375244140625, 0.4094352722167969, 0.42603302001953125, 0.4426307678222656, 0.459228515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 8.0, 0.0, 6.0, 9.0, 8.0, 7.0, 10.0, 10.0, 17.0, 17.0, 47.0, 46.0, 43.0, 74.0, 73.0, 99.0, 105.0, 88.0, 84.0, 56.0, 49.0, 34.0, 25.0, 15.0, 12.0, 10.0, 11.0, 8.0, 5.0, 5.0, 1.0, 5.0, 3.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.25830078125, -0.2507362365722656, -0.24317169189453125, -0.23560714721679688, -0.2280426025390625, -0.22047805786132812, -0.21291351318359375, -0.20534896850585938, -0.197784423828125, -0.19021987915039062, -0.18265533447265625, -0.17509078979492188, -0.1675262451171875, -0.15996170043945312, -0.15239715576171875, -0.14483261108398438, -0.13726806640625, -0.12970352172851562, -0.12213897705078125, -0.11457443237304688, -0.1070098876953125, -0.09944534301757812, -0.09188079833984375, -0.08431625366210938, -0.076751708984375, -0.06918716430664062, -0.06162261962890625, -0.054058074951171875, -0.0464935302734375, -0.038928985595703125, -0.03136444091796875, -0.023799896240234375, -0.0162353515625, -0.008670806884765625, -0.00110626220703125, 0.006458282470703125, 0.0140228271484375, 0.021587371826171875, 0.02915191650390625, 0.036716461181640625, 0.044281005859375, 0.051845550537109375, 0.05941009521484375, 0.06697463989257812, 0.0745391845703125, 0.08210372924804688, 0.08966827392578125, 0.09723281860351562, 0.10479736328125, 0.11236190795898438, 0.11992645263671875, 0.12749099731445312, 0.1350555419921875, 0.14262008666992188, 0.15018463134765625, 0.15774917602539062, 0.165313720703125, 0.17287826538085938, 0.18044281005859375, 0.18800735473632812, 0.1955718994140625, 0.20313644409179688, 0.21070098876953125, 0.21826553344726562, 0.225830078125]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 8.0, 3.0, 16.0, 49.0, 130.0, 338.0, 280.0, 112.0, 31.0, 15.0, 8.0, 10.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.274903297424316, -13.925827026367188, -13.576750755310059, -13.22767448425293, -12.8785982131958, -12.529521942138672, -12.180445671081543, -11.831369400024414, -11.482293128967285, -11.133216857910156, -10.784140586853027, -10.435064315795898, -10.08598804473877, -9.73691177368164, -9.387835502624512, -9.038759231567383, -8.689682960510254, -8.340606689453125, -7.991530418395996, -7.642454147338867, -7.293377876281738, -6.944301605224609, -6.5952253341674805, -6.246149063110352, -5.897072792053223, -5.547996520996094, -5.198920249938965, -4.849843978881836, -4.500767707824707, -4.151691436767578, -3.802615165710449, -3.4535388946533203, -3.1044626235961914, -2.7553863525390625, -2.4063100814819336, -2.0572338104248047, -1.7081575393676758, -1.3590812683105469, -1.010004997253418, -0.6609287261962891, -0.31185245513916016, 0.03722381591796875, 0.38630008697509766, 0.7353763580322266, 1.0844526290893555, 1.4335289001464844, 1.7826051712036133, 2.131681442260742, 2.480757713317871, 2.829833984375, 3.178910255432129, 3.527986526489258, 3.8770627975463867, 4.226139068603516, 4.5752153396606445, 4.924291610717773, 5.273367881774902, 5.622444152832031, 5.97152042388916, 6.320596694946289, 6.669672966003418, 7.018749237060547, 7.367825508117676, 7.716901779174805, 8.065978050231934]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 4.0, 9.0, 5.0, 10.0, 13.0, 12.0, 14.0, 13.0, 17.0, 23.0, 16.0, 28.0, 32.0, 42.0, 30.0, 27.0, 45.0, 43.0, 54.0, 49.0, 63.0, 43.0, 41.0, 49.0, 39.0, 36.0, 37.0, 29.0, 30.0, 30.0, 14.0, 18.0, 15.0, 15.0, 12.0, 12.0, 7.0, 4.0, 5.0, 2.0, 3.0, 5.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.055614471435547, -3.9046711921691895, -3.753728151321411, -3.602785110473633, -3.4518418312072754, -3.300898551940918, -3.1499555110931396, -2.9990124702453613, -2.848069190979004, -2.6971259117126465, -2.546182870864868, -2.39523983001709, -2.2442965507507324, -2.093353271484375, -1.9424102306365967, -1.7914670705795288, -1.640523910522461, -1.489580750465393, -1.3386375904083252, -1.1876944303512573, -1.0367512702941895, -0.8858081102371216, -0.7348649501800537, -0.5839217901229858, -0.43297863006591797, -0.2820354700088501, -0.13109230995178223, 0.019850850105285645, 0.17079401016235352, 0.3217371702194214, 0.47268033027648926, 0.6236234903335571, 0.7745671272277832, 0.9255102872848511, 1.076453447341919, 1.2273966073989868, 1.3783397674560547, 1.5292829275131226, 1.6802260875701904, 1.8311692476272583, 1.9821124076843262, 2.1330556869506836, 2.283998727798462, 2.4349417686462402, 2.5858850479125977, 2.736828327178955, 2.8877713680267334, 3.0387144088745117, 3.189657688140869, 3.3406009674072266, 3.491544008255005, 3.642487049102783, 3.7934303283691406, 3.944373607635498, 4.0953168869018555, 4.246259689331055, 4.397202968597412, 4.5481462478637695, 4.699089050292969, 4.850032329559326, 5.000975608825684, 5.151918888092041, 5.302862167358398, 5.453804969787598, 5.604748249053955]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 14.0, 16.0, 14.0, 15.0, 25.0, 35.0, 62.0, 75.0, 144.0, 205.0, 382.0, 610.0, 1152.0, 2208.0, 5146.0, 14479.0, 54614.0, 517049.0, 3410533.0, 144409.0, 27326.0, 8693.0, 3461.0, 1569.0, 819.0, 475.0, 254.0, 147.0, 112.0, 67.0, 59.0, 22.0, 25.0, 20.0, 16.0, 11.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.12109375, -2.048614501953125, -1.97613525390625, -1.903656005859375, -1.8311767578125, -1.758697509765625, -1.68621826171875, -1.613739013671875, -1.541259765625, -1.468780517578125, -1.39630126953125, -1.323822021484375, -1.2513427734375, -1.178863525390625, -1.10638427734375, -1.033905029296875, -0.96142578125, -0.888946533203125, -0.81646728515625, -0.743988037109375, -0.6715087890625, -0.599029541015625, -0.52655029296875, -0.454071044921875, -0.381591796875, -0.309112548828125, -0.23663330078125, -0.164154052734375, -0.0916748046875, -0.019195556640625, 0.05328369140625, 0.125762939453125, 0.1982421875, 0.270721435546875, 0.34320068359375, 0.415679931640625, 0.4881591796875, 0.560638427734375, 0.63311767578125, 0.705596923828125, 0.778076171875, 0.850555419921875, 0.92303466796875, 0.995513916015625, 1.0679931640625, 1.140472412109375, 1.21295166015625, 1.285430908203125, 1.35791015625, 1.430389404296875, 1.50286865234375, 1.575347900390625, 1.6478271484375, 1.720306396484375, 1.79278564453125, 1.865264892578125, 1.937744140625, 2.010223388671875, 2.08270263671875, 2.155181884765625, 2.2276611328125, 2.300140380859375, 2.37261962890625, 2.445098876953125, 2.517578125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 6.0, 2.0, 2.0, 3.0, 11.0, 9.0, 16.0, 16.0, 25.0, 21.0, 34.0, 52.0, 46.0, 56.0, 73.0, 71.0, 77.0, 70.0, 71.0, 62.0, 56.0, 55.0, 35.0, 29.0, 24.0, 11.0, 14.0, 14.0, 15.0, 5.0, 5.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8134765625, -1.7582244873046875, -1.702972412109375, -1.6477203369140625, -1.59246826171875, -1.5372161865234375, -1.481964111328125, -1.4267120361328125, -1.3714599609375, -1.3162078857421875, -1.260955810546875, -1.2057037353515625, -1.15045166015625, -1.0951995849609375, -1.039947509765625, -0.9846954345703125, -0.929443359375, -0.8741912841796875, -0.818939208984375, -0.7636871337890625, -0.70843505859375, -0.6531829833984375, -0.597930908203125, -0.5426788330078125, -0.4874267578125, -0.4321746826171875, -0.376922607421875, -0.3216705322265625, -0.26641845703125, -0.2111663818359375, -0.155914306640625, -0.1006622314453125, -0.04541015625, 0.0098419189453125, 0.065093994140625, 0.1203460693359375, 0.17559814453125, 0.2308502197265625, 0.286102294921875, 0.3413543701171875, 0.3966064453125, 0.4518585205078125, 0.507110595703125, 0.5623626708984375, 0.61761474609375, 0.6728668212890625, 0.728118896484375, 0.7833709716796875, 0.838623046875, 0.8938751220703125, 0.949127197265625, 1.0043792724609375, 1.05963134765625, 1.1148834228515625, 1.170135498046875, 1.2253875732421875, 1.2806396484375, 1.3358917236328125, 1.391143798828125, 1.4463958740234375, 1.50164794921875, 1.5569000244140625, 1.612152099609375, 1.6674041748046875, 1.72265625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 10.0, 5.0, 9.0, 14.0, 22.0, 18.0, 29.0, 34.0, 95.0, 208.0, 496.0, 2104.0, 25208.0, 4067669.0, 93143.0, 3978.0, 717.0, 231.0, 109.0, 64.0, 38.0, 32.0, 15.0, 8.0, 9.0, 4.0, 4.0, 1.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.66796875, -5.455322265625, -5.24267578125, -5.030029296875, -4.8173828125, -4.604736328125, -4.39208984375, -4.179443359375, -3.966796875, -3.754150390625, -3.54150390625, -3.328857421875, -3.1162109375, -2.903564453125, -2.69091796875, -2.478271484375, -2.265625, -2.052978515625, -1.84033203125, -1.627685546875, -1.4150390625, -1.202392578125, -0.98974609375, -0.777099609375, -0.564453125, -0.351806640625, -0.13916015625, 0.073486328125, 0.2861328125, 0.498779296875, 0.71142578125, 0.924072265625, 1.13671875, 1.349365234375, 1.56201171875, 1.774658203125, 1.9873046875, 2.199951171875, 2.41259765625, 2.625244140625, 2.837890625, 3.050537109375, 3.26318359375, 3.475830078125, 3.6884765625, 3.901123046875, 4.11376953125, 4.326416015625, 4.5390625, 4.751708984375, 4.96435546875, 5.177001953125, 5.3896484375, 5.602294921875, 5.81494140625, 6.027587890625, 6.240234375, 6.452880859375, 6.66552734375, 6.878173828125, 7.0908203125, 7.303466796875, 7.51611328125, 7.728759765625, 7.94140625]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 5.0, 11.0, 9.0, 20.0, 23.0, 44.0, 52.0, 93.0, 104.0, 205.0, 442.0, 1618.0, 760.0, 236.0, 157.0, 94.0, 55.0, 39.0, 29.0, 24.0, 15.0, 11.0, 4.0, 7.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82861328125, -0.8054351806640625, -0.782257080078125, -0.7590789794921875, -0.73590087890625, -0.7127227783203125, -0.689544677734375, -0.6663665771484375, -0.6431884765625, -0.6200103759765625, -0.596832275390625, -0.5736541748046875, -0.55047607421875, -0.5272979736328125, -0.504119873046875, -0.4809417724609375, -0.457763671875, -0.4345855712890625, -0.411407470703125, -0.3882293701171875, -0.36505126953125, -0.3418731689453125, -0.318695068359375, -0.2955169677734375, -0.2723388671875, -0.2491607666015625, -0.225982666015625, -0.2028045654296875, -0.17962646484375, -0.1564483642578125, -0.133270263671875, -0.1100921630859375, -0.0869140625, -0.0637359619140625, -0.040557861328125, -0.0173797607421875, 0.00579833984375, 0.0289764404296875, 0.052154541015625, 0.0753326416015625, 0.0985107421875, 0.1216888427734375, 0.144866943359375, 0.1680450439453125, 0.19122314453125, 0.2144012451171875, 0.237579345703125, 0.2607574462890625, 0.283935546875, 0.3071136474609375, 0.330291748046875, 0.3534698486328125, 0.37664794921875, 0.3998260498046875, 0.423004150390625, 0.4461822509765625, 0.4693603515625, 0.4925384521484375, 0.515716552734375, 0.5388946533203125, 0.56207275390625, 0.5852508544921875, 0.608428955078125, 0.6316070556640625, 0.65478515625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 11.0, 13.0, 15.0, 21.0, 50.0, 88.0, 190.0, 235.0, 188.0, 81.0, 43.0, 22.0, 13.0, 8.0, 9.0, 11.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.692881107330322, -6.5391998291015625, -6.385518550872803, -6.231837749481201, -6.078156471252441, -5.924475193023682, -5.770793914794922, -5.617112636566162, -5.463431358337402, -5.309750080108643, -5.156068801879883, -5.002388000488281, -4.8487067222595215, -4.695025444030762, -4.541344165802002, -4.387662887573242, -4.233982086181641, -4.080300807952881, -3.9266197681427, -3.7729384899139404, -3.6192574501037598, -3.465576171875, -3.3118948936462402, -3.1582136154174805, -3.0045325756073, -2.85085129737854, -2.6971702575683594, -2.5434889793395996, -2.38980770111084, -2.236126661300659, -2.0824453830718994, -1.9287642240524292, -1.775083303451538, -1.6214021444320679, -1.4677209854125977, -1.314039707183838, -1.1603585481643677, -1.0066773891448975, -0.8529961705207825, -0.6993149518966675, -0.5456337928771973, -0.39195260405540466, -0.23827141523361206, -0.08459022641181946, 0.06909096240997314, 0.22277212142944336, 0.37645334005355835, 0.5301345586776733, 0.6838157176971436, 0.8374968767166138, 0.9911780953407288, 1.1448593139648438, 1.298540472984314, 1.4522216320037842, 1.605902910232544, 1.7595840692520142, 1.9132652282714844, 2.066946506500244, 2.220627546310425, 2.3743088245391846, 2.5279898643493652, 2.681671142578125, 2.8353524208068848, 2.9890336990356445, 3.142714738845825]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 12.0, 13.0, 16.0, 18.0, 18.0, 23.0, 32.0, 40.0, 56.0, 51.0, 57.0, 73.0, 49.0, 63.0, 78.0, 63.0, 65.0, 46.0, 50.0, 25.0, 30.0, 24.0, 16.0, 17.0, 13.0, 11.0, 11.0, 4.0, 7.0, 3.0, 1.0, 0.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7186754941940308, -1.656463861465454, -1.594252347946167, -1.5320407152175903, -1.4698290824890137, -1.407617449760437, -1.3454058170318604, -1.2831943035125732, -1.2209826707839966, -1.15877103805542, -1.0965595245361328, -1.0343478918075562, -0.9721362590789795, -0.9099246263504028, -0.847713053226471, -0.7855014801025391, -0.7232898473739624, -0.6610782146453857, -0.5988666415214539, -0.536655068397522, -0.4744434356689453, -0.41223183274269104, -0.35002022981643677, -0.2878086268901825, -0.22559702396392822, -0.16338542103767395, -0.10117381811141968, -0.038962215185165405, 0.023249387741088867, 0.08546099066734314, 0.1476725935935974, 0.20988419651985168, 0.2720959186553955, 0.3343075215816498, 0.39651912450790405, 0.4587307274341583, 0.5209423303604126, 0.5831539630889893, 0.6453655362129211, 0.707577109336853, 0.7697887420654297, 0.8320003747940063, 0.8942119479179382, 0.9564235210418701, 1.0186351537704468, 1.0808467864990234, 1.1430583000183105, 1.2052699327468872, 1.2674815654754639, 1.3296931982040405, 1.3919048309326172, 1.4541163444519043, 1.516327977180481, 1.5785396099090576, 1.6407511234283447, 1.7029627561569214, 1.765174388885498, 1.8273860216140747, 1.8895976543426514, 1.9518091678619385, 2.0140209197998047, 2.076232433319092, 2.138443946838379, 2.200655698776245, 2.2628672122955322]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 1.0, 3.0, 4.0, 9.0, 9.0, 18.0, 20.0, 15.0, 33.0, 53.0, 83.0, 126.0, 176.0, 257.0, 424.0, 702.0, 1174.0, 2101.0, 4217.0, 8470.0, 19796.0, 56936.0, 212582.0, 502344.0, 161046.0, 45767.0, 16658.0, 7196.0, 3625.0, 1841.0, 1084.0, 643.0, 385.0, 274.0, 162.0, 97.0, 69.0, 38.0, 33.0, 25.0, 21.0, 14.0, 11.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09918212890625, -0.0958089828491211, -0.09243583679199219, -0.08906269073486328, -0.08568954467773438, -0.08231639862060547, -0.07894325256347656, -0.07557010650634766, -0.07219696044921875, -0.06882381439208984, -0.06545066833496094, -0.06207752227783203, -0.058704376220703125, -0.05533123016357422, -0.05195808410644531, -0.048584938049316406, -0.0452117919921875, -0.041838645935058594, -0.03846549987792969, -0.03509235382080078, -0.031719207763671875, -0.02834606170654297, -0.024972915649414062, -0.021599769592285156, -0.01822662353515625, -0.014853477478027344, -0.011480331420898438, -0.008107185363769531, -0.004734039306640625, -0.0013608932495117188, 0.0020122528076171875, 0.005385398864746094, 0.008758544921875, 0.012131690979003906, 0.015504837036132812, 0.01887798309326172, 0.022251129150390625, 0.02562427520751953, 0.028997421264648438, 0.032370567321777344, 0.03574371337890625, 0.039116859436035156, 0.04249000549316406, 0.04586315155029297, 0.049236297607421875, 0.05260944366455078, 0.05598258972167969, 0.059355735778808594, 0.0627288818359375, 0.0661020278930664, 0.06947517395019531, 0.07284832000732422, 0.07622146606445312, 0.07959461212158203, 0.08296775817871094, 0.08634090423583984, 0.08971405029296875, 0.09308719635009766, 0.09646034240722656, 0.09983348846435547, 0.10320663452148438, 0.10657978057861328, 0.10995292663574219, 0.1133260726928711, 0.11669921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 9.0, 17.0, 22.0, 21.0, 29.0, 48.0, 54.0, 62.0, 78.0, 82.0, 100.0, 88.0, 77.0, 72.0, 54.0, 49.0, 32.0, 21.0, 24.0, 13.0, 9.0, 14.0, 3.0, 7.0, 0.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5361328125, -1.4805755615234375, -1.425018310546875, -1.3694610595703125, -1.31390380859375, -1.2583465576171875, -1.202789306640625, -1.1472320556640625, -1.0916748046875, -1.0361175537109375, -0.980560302734375, -0.9250030517578125, -0.86944580078125, -0.8138885498046875, -0.758331298828125, -0.7027740478515625, -0.647216796875, -0.5916595458984375, -0.536102294921875, -0.4805450439453125, -0.42498779296875, -0.3694305419921875, -0.313873291015625, -0.2583160400390625, -0.2027587890625, -0.1472015380859375, -0.091644287109375, -0.0360870361328125, 0.01947021484375, 0.0750274658203125, 0.130584716796875, 0.1861419677734375, 0.24169921875, 0.2972564697265625, 0.352813720703125, 0.4083709716796875, 0.46392822265625, 0.5194854736328125, 0.575042724609375, 0.6305999755859375, 0.6861572265625, 0.7417144775390625, 0.797271728515625, 0.8528289794921875, 0.90838623046875, 0.9639434814453125, 1.019500732421875, 1.0750579833984375, 1.130615234375, 1.1861724853515625, 1.241729736328125, 1.2972869873046875, 1.35284423828125, 1.4084014892578125, 1.463958740234375, 1.5195159912109375, 1.5750732421875, 1.6306304931640625, 1.686187744140625, 1.7417449951171875, 1.79730224609375, 1.8528594970703125, 1.908416748046875, 1.9639739990234375, 2.01953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 7.0, 3.0, 10.0, 11.0, 12.0, 17.0, 29.0, 36.0, 42.0, 58.0, 95.0, 178.0, 207.0, 444.0, 1316.0, 7356.0, 104749.0, 825492.0, 98049.0, 7884.0, 1339.0, 462.0, 282.0, 149.0, 93.0, 54.0, 48.0, 36.0, 24.0, 19.0, 15.0, 12.0, 9.0, 7.0, 4.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2117919921875, -0.2040882110595703, -0.19638442993164062, -0.18868064880371094, -0.18097686767578125, -0.17327308654785156, -0.16556930541992188, -0.1578655242919922, -0.1501617431640625, -0.1424579620361328, -0.13475418090820312, -0.12705039978027344, -0.11934661865234375, -0.11164283752441406, -0.10393905639648438, -0.09623527526855469, -0.088531494140625, -0.08082771301269531, -0.07312393188476562, -0.06542015075683594, -0.05771636962890625, -0.05001258850097656, -0.042308807373046875, -0.03460502624511719, -0.0269012451171875, -0.019197463989257812, -0.011493682861328125, -0.0037899017333984375, 0.00391387939453125, 0.011617660522460938, 0.019321441650390625, 0.027025222778320312, 0.03472900390625, 0.04243278503417969, 0.050136566162109375, 0.05784034729003906, 0.06554412841796875, 0.07324790954589844, 0.08095169067382812, 0.08865547180175781, 0.0963592529296875, 0.10406303405761719, 0.11176681518554688, 0.11947059631347656, 0.12717437744140625, 0.13487815856933594, 0.14258193969726562, 0.1502857208251953, 0.157989501953125, 0.1656932830810547, 0.17339706420898438, 0.18110084533691406, 0.18880462646484375, 0.19650840759277344, 0.20421218872070312, 0.2119159698486328, 0.2196197509765625, 0.2273235321044922, 0.23502731323242188, 0.24273109436035156, 0.25043487548828125, 0.25813865661621094, 0.2658424377441406, 0.2735462188720703, 0.28125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 9.0, 4.0, 0.0, 5.0, 8.0, 9.0, 11.0, 25.0, 17.0, 25.0, 36.0, 34.0, 35.0, 46.0, 50.0, 42.0, 50.0, 41.0, 47.0, 65.0, 70.0, 55.0, 51.0, 44.0, 42.0, 31.0, 26.0, 24.0, 18.0, 20.0, 8.0, 14.0, 11.0, 9.0, 5.0, 3.0, 4.0, 5.0, 2.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.173828125, -2.0953369140625, -2.016845703125, -1.9383544921875, -1.85986328125, -1.7813720703125, -1.702880859375, -1.6243896484375, -1.5458984375, -1.4674072265625, -1.388916015625, -1.3104248046875, -1.23193359375, -1.1534423828125, -1.074951171875, -0.9964599609375, -0.91796875, -0.8394775390625, -0.760986328125, -0.6824951171875, -0.60400390625, -0.5255126953125, -0.447021484375, -0.3685302734375, -0.2900390625, -0.2115478515625, -0.133056640625, -0.0545654296875, 0.02392578125, 0.1024169921875, 0.180908203125, 0.2593994140625, 0.337890625, 0.4163818359375, 0.494873046875, 0.5733642578125, 0.65185546875, 0.7303466796875, 0.808837890625, 0.8873291015625, 0.9658203125, 1.0443115234375, 1.122802734375, 1.2012939453125, 1.27978515625, 1.3582763671875, 1.436767578125, 1.5152587890625, 1.59375, 1.6722412109375, 1.750732421875, 1.8292236328125, 1.90771484375, 1.9862060546875, 2.064697265625, 2.1431884765625, 2.2216796875, 2.3001708984375, 2.378662109375, 2.4571533203125, 2.53564453125, 2.6141357421875, 2.692626953125, 2.7711181640625, 2.849609375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 6.0, 6.0, 1.0, 2.0, 3.0, 2.0, 7.0, 14.0, 13.0, 26.0, 32.0, 50.0, 87.0, 160.0, 316.0, 745.0, 2656.0, 569554.0, 470945.0, 2631.0, 586.0, 305.0, 155.0, 89.0, 51.0, 29.0, 26.0, 14.0, 13.0, 7.0, 5.0, 3.0, 4.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07598876953125, -0.07294845581054688, -0.06990814208984375, -0.06686782836914062, -0.0638275146484375, -0.060787200927734375, -0.05774688720703125, -0.054706573486328125, -0.051666259765625, -0.048625946044921875, -0.04558563232421875, -0.042545318603515625, -0.0395050048828125, -0.036464691162109375, -0.03342437744140625, -0.030384063720703125, -0.02734375, -0.024303436279296875, -0.02126312255859375, -0.018222808837890625, -0.0151824951171875, -0.012142181396484375, -0.00910186767578125, -0.006061553955078125, -0.003021240234375, 1.9073486328125e-05, 0.00305938720703125, 0.006099700927734375, 0.0091400146484375, 0.012180328369140625, 0.01522064208984375, 0.018260955810546875, 0.02130126953125, 0.024341583251953125, 0.02738189697265625, 0.030422210693359375, 0.0334625244140625, 0.036502838134765625, 0.03954315185546875, 0.042583465576171875, 0.045623779296875, 0.048664093017578125, 0.05170440673828125, 0.054744720458984375, 0.0577850341796875, 0.060825347900390625, 0.06386566162109375, 0.06690597534179688, 0.0699462890625, 0.07298660278320312, 0.07602691650390625, 0.07906723022460938, 0.0821075439453125, 0.08514785766601562, 0.08818817138671875, 0.09122848510742188, 0.094268798828125, 0.09730911254882812, 0.10034942626953125, 0.10338973999023438, 0.1064300537109375, 0.10947036743164062, 0.11251068115234375, 0.11555099487304688, 0.11859130859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 6.0, 11.0, 7.0, 8.0, 14.0, 21.0, 22.0, 28.0, 43.0, 61.0, 70.0, 77.0, 87.0, 73.0, 81.0, 96.0, 76.0, 53.0, 41.0, 26.0, 30.0, 14.0, 16.0, 13.0, 6.0, 5.0, 4.0, 5.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.0325183868408203e-05, -1.9739381968975067e-05, -1.915358006954193e-05, -1.8567778170108795e-05, -1.798197627067566e-05, -1.7396174371242523e-05, -1.6810372471809387e-05, -1.622457057237625e-05, -1.5638768672943115e-05, -1.505296677350998e-05, -1.4467164874076843e-05, -1.3881362974643707e-05, -1.3295561075210571e-05, -1.2709759175777435e-05, -1.21239572763443e-05, -1.1538155376911163e-05, -1.0952353477478027e-05, -1.0366551578044891e-05, -9.780749678611755e-06, -9.19494777917862e-06, -8.609145879745483e-06, -8.023343980312347e-06, -7.4375420808792114e-06, -6.8517401814460754e-06, -6.2659382820129395e-06, -5.6801363825798035e-06, -5.0943344831466675e-06, -4.5085325837135315e-06, -3.9227306842803955e-06, -3.3369287848472595e-06, -2.7511268854141235e-06, -2.1653249859809875e-06, -1.5795230865478516e-06, -9.937211871147156e-07, -4.079192876815796e-07, 1.778826117515564e-07, 7.636845111846924e-07, 1.3494864106178284e-06, 1.9352883100509644e-06, 2.5210902094841003e-06, 3.1068921089172363e-06, 3.6926940083503723e-06, 4.278495907783508e-06, 4.864297807216644e-06, 5.45009970664978e-06, 6.035901606082916e-06, 6.621703505516052e-06, 7.207505404949188e-06, 7.793307304382324e-06, 8.37910920381546e-06, 8.964911103248596e-06, 9.550713002681732e-06, 1.0136514902114868e-05, 1.0722316801548004e-05, 1.130811870098114e-05, 1.1893920600414276e-05, 1.2479722499847412e-05, 1.3065524399280548e-05, 1.3651326298713684e-05, 1.423712819814682e-05, 1.4822930097579956e-05, 1.5408731997013092e-05, 1.5994533896446228e-05, 1.6580335795879364e-05, 1.71661376953125e-05]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 7.0, 7.0, 9.0, 25.0, 29.0, 39.0, 74.0, 141.0, 254.0, 670.0, 2006.0, 10616.0, 491193.0, 529911.0, 10491.0, 1933.0, 622.0, 254.0, 106.0, 64.0, 38.0, 21.0, 14.0, 10.0, 4.0, 4.0, 7.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0787353515625, -0.07570743560791016, -0.07267951965332031, -0.06965160369873047, -0.06662368774414062, -0.06359577178955078, -0.06056785583496094, -0.057539939880371094, -0.05451202392578125, -0.051484107971191406, -0.04845619201660156, -0.04542827606201172, -0.042400360107421875, -0.03937244415283203, -0.03634452819824219, -0.033316612243652344, -0.0302886962890625, -0.027260780334472656, -0.024232864379882812, -0.02120494842529297, -0.018177032470703125, -0.015149116516113281, -0.012121200561523438, -0.009093284606933594, -0.00606536865234375, -0.0030374526977539062, -9.5367431640625e-06, 0.0030183792114257812, 0.006046295166015625, 0.009074211120605469, 0.012102127075195312, 0.015130043029785156, 0.018157958984375, 0.021185874938964844, 0.024213790893554688, 0.02724170684814453, 0.030269622802734375, 0.03329753875732422, 0.03632545471191406, 0.039353370666503906, 0.04238128662109375, 0.045409202575683594, 0.04843711853027344, 0.05146503448486328, 0.054492950439453125, 0.05752086639404297, 0.06054878234863281, 0.06357669830322266, 0.0666046142578125, 0.06963253021240234, 0.07266044616699219, 0.07568836212158203, 0.07871627807617188, 0.08174419403076172, 0.08477210998535156, 0.0878000259399414, 0.09082794189453125, 0.0938558578491211, 0.09688377380371094, 0.09991168975830078, 0.10293960571289062, 0.10596752166748047, 0.10899543762207031, 0.11202335357666016, 0.11505126953125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 8.0, 10.0, 12.0, 20.0, 29.0, 66.0, 168.0, 363.0, 135.0, 64.0, 22.0, 18.0, 17.0, 14.0, 10.0, 12.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0205078125, -0.019943594932556152, -0.019379377365112305, -0.018815159797668457, -0.01825094223022461, -0.01768672466278076, -0.017122507095336914, -0.016558289527893066, -0.01599407196044922, -0.015429854393005371, -0.014865636825561523, -0.014301419258117676, -0.013737201690673828, -0.01317298412322998, -0.012608766555786133, -0.012044548988342285, -0.011480331420898438, -0.01091611385345459, -0.010351896286010742, -0.009787678718566895, -0.009223461151123047, -0.0086592435836792, -0.008095026016235352, -0.007530808448791504, -0.006966590881347656, -0.006402373313903809, -0.005838155746459961, -0.005273938179016113, -0.004709720611572266, -0.004145503044128418, -0.0035812854766845703, -0.0030170679092407227, -0.002452850341796875, -0.0018886327743530273, -0.0013244152069091797, -0.000760197639465332, -0.00019598007202148438, 0.0003682374954223633, 0.0009324550628662109, 0.0014966726303100586, 0.0020608901977539062, 0.002625107765197754, 0.0031893253326416016, 0.0037535429000854492, 0.004317760467529297, 0.0048819780349731445, 0.005446195602416992, 0.00601041316986084, 0.0065746307373046875, 0.007138848304748535, 0.007703065872192383, 0.00826728343963623, 0.008831501007080078, 0.009395718574523926, 0.009959936141967773, 0.010524153709411621, 0.011088371276855469, 0.011652588844299316, 0.012216806411743164, 0.012781023979187012, 0.01334524154663086, 0.013909459114074707, 0.014473676681518555, 0.015037894248962402, 0.01560211181640625]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 16.0, 10.0, 25.0, 53.0, 97.0, 237.0, 299.0, 138.0, 56.0, 21.0, 14.0, 11.0, 16.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.168915271759033, -5.043398857116699, -4.917882442474365, -4.7923665046691895, -4.6668500900268555, -4.5413336753845215, -4.4158172607421875, -4.290301322937012, -4.164784908294678, -4.039268493652344, -3.913752317428589, -3.788235902786255, -3.6627197265625, -3.537203311920166, -3.411686897277832, -3.286170721054077, -3.160654306411743, -3.035137891769409, -2.9096217155456543, -2.7841053009033203, -2.6585891246795654, -2.5330727100372314, -2.4075565338134766, -2.2820401191711426, -2.1565237045288086, -2.0310072898864746, -1.9054911136627197, -1.7799746990203857, -1.6544585227966309, -1.5289421081542969, -1.4034258127212524, -1.277909517288208, -1.1523935794830322, -1.0268772840499878, -0.9013609886169434, -0.7758446335792542, -0.6503283381462097, -0.5248120427131653, -0.3992956876754761, -0.27377939224243164, -0.1482630968093872, -0.02274678647518158, 0.10276952385902405, 0.22828584909439087, 0.3538021445274353, 0.47931843996047974, 0.604834794998169, 0.7303510904312134, 0.8558673858642578, 0.9813836812973022, 1.1068999767303467, 1.2324163913726807, 1.3579325675964355, 1.4834489822387695, 1.608965277671814, 1.7344815731048584, 1.8599978685379028, 1.9855141639709473, 2.1110305786132812, 2.236546754837036, 2.36206316947937, 2.487579345703125, 2.613095760345459, 2.738612174987793, 2.864128351211548]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 8.0, 16.0, 18.0, 18.0, 24.0, 27.0, 31.0, 55.0, 67.0, 71.0, 95.0, 70.0, 84.0, 87.0, 72.0, 56.0, 46.0, 35.0, 27.0, 22.0, 18.0, 14.0, 9.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3749933242797852, -1.3238755464553833, -1.272757887840271, -1.2216401100158691, -1.1705224514007568, -1.119404673576355, -1.0682870149612427, -1.0171692371368408, -0.9660515785217285, -0.9149338603019714, -0.8638161420822144, -0.8126984238624573, -0.7615807056427002, -0.7104629278182983, -0.659345269203186, -0.6082274913787842, -0.5571097731590271, -0.50599205493927, -0.45487433671951294, -0.40375661849975586, -0.3526389002799988, -0.3015211522579193, -0.25040343403816223, -0.19928571581840515, -0.14816799759864807, -0.09705027937889099, -0.045932553708553314, 0.005185171961784363, 0.05630289018154144, 0.10742062330245972, 0.1585383415222168, 0.20965605974197388, 0.26077377796173096, 0.31189149618148804, 0.3630092144012451, 0.4141269326210022, 0.4652446508407593, 0.5163624286651611, 0.5674800872802734, 0.6185978651046753, 0.6697155237197876, 0.7208332419395447, 0.7719509601593018, 0.8230686783790588, 0.8741863965988159, 0.9253041744232178, 0.9764218330383301, 1.027539610862732, 1.0786573886871338, 1.1297751665115356, 1.180892825126648, 1.2320106029510498, 1.283128261566162, 1.334246039390564, 1.3853636980056763, 1.4364814758300781, 1.4875991344451904, 1.5387169122695923, 1.5898345708847046, 1.6409523487091064, 1.6920700073242188, 1.7431877851486206, 1.794305443763733, 1.8454232215881348, 1.896540880203247]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 5.0, 7.0, 3.0, 8.0, 18.0, 34.0, 94.0, 324.0, 1047.0, 6274.0, 180208.0, 841444.0, 16532.0, 1851.0, 446.0, 151.0, 57.0, 18.0, 10.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.986328125, -3.854278564453125, -3.72222900390625, -3.590179443359375, -3.4581298828125, -3.326080322265625, -3.19403076171875, -3.061981201171875, -2.929931640625, -2.797882080078125, -2.66583251953125, -2.533782958984375, -2.4017333984375, -2.269683837890625, -2.13763427734375, -2.005584716796875, -1.87353515625, -1.741485595703125, -1.60943603515625, -1.477386474609375, -1.3453369140625, -1.213287353515625, -1.08123779296875, -0.949188232421875, -0.817138671875, -0.685089111328125, -0.55303955078125, -0.420989990234375, -0.2889404296875, -0.156890869140625, -0.02484130859375, 0.107208251953125, 0.2392578125, 0.371307373046875, 0.50335693359375, 0.635406494140625, 0.7674560546875, 0.899505615234375, 1.03155517578125, 1.163604736328125, 1.295654296875, 1.427703857421875, 1.55975341796875, 1.691802978515625, 1.8238525390625, 1.955902099609375, 2.08795166015625, 2.220001220703125, 2.35205078125, 2.484100341796875, 2.61614990234375, 2.748199462890625, 2.8802490234375, 3.012298583984375, 3.14434814453125, 3.276397705078125, 3.408447265625, 3.540496826171875, 3.67254638671875, 3.804595947265625, 3.9366455078125, 4.068695068359375, 4.20074462890625, 4.332794189453125, 4.46484375]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 8.0, 12.0, 9.0, 9.0, 10.0, 20.0, 22.0, 23.0, 32.0, 44.0, 59.0, 69.0, 74.0, 83.0, 85.0, 83.0, 77.0, 46.0, 48.0, 31.0, 32.0, 30.0, 26.0, 15.0, 9.0, 11.0, 11.0, 7.0, 6.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.974609375, -2.865966796875, -2.75732421875, -2.648681640625, -2.5400390625, -2.431396484375, -2.32275390625, -2.214111328125, -2.10546875, -1.996826171875, -1.88818359375, -1.779541015625, -1.6708984375, -1.562255859375, -1.45361328125, -1.344970703125, -1.236328125, -1.127685546875, -1.01904296875, -0.910400390625, -0.8017578125, -0.693115234375, -0.58447265625, -0.475830078125, -0.3671875, -0.258544921875, -0.14990234375, -0.041259765625, 0.0673828125, 0.176025390625, 0.28466796875, 0.393310546875, 0.501953125, 0.610595703125, 0.71923828125, 0.827880859375, 0.9365234375, 1.045166015625, 1.15380859375, 1.262451171875, 1.37109375, 1.479736328125, 1.58837890625, 1.697021484375, 1.8056640625, 1.914306640625, 2.02294921875, 2.131591796875, 2.240234375, 2.348876953125, 2.45751953125, 2.566162109375, 2.6748046875, 2.783447265625, 2.89208984375, 3.000732421875, 3.109375, 3.218017578125, 3.32666015625, 3.435302734375, 3.5439453125, 3.652587890625, 3.76123046875, 3.869873046875, 3.978515625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 3.0, 6.0, 3.0, 2.0, 8.0, 7.0, 9.0, 9.0, 11.0, 11.0, 24.0, 30.0, 43.0, 39.0, 61.0, 65.0, 137.0, 171.0, 301.0, 535.0, 1089.0, 2616.0, 7630.0, 34006.0, 308741.0, 613216.0, 61548.0, 11420.0, 3607.0, 1428.0, 678.0, 377.0, 246.0, 128.0, 93.0, 64.0, 47.0, 37.0, 22.0, 25.0, 13.0, 14.0, 11.0, 7.0, 6.0, 2.0, 9.0, 5.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2734375, -1.2297515869140625, -1.186065673828125, -1.1423797607421875, -1.09869384765625, -1.0550079345703125, -1.011322021484375, -0.9676361083984375, -0.9239501953125, -0.8802642822265625, -0.836578369140625, -0.7928924560546875, -0.74920654296875, -0.7055206298828125, -0.661834716796875, -0.6181488037109375, -0.574462890625, -0.5307769775390625, -0.487091064453125, -0.4434051513671875, -0.39971923828125, -0.3560333251953125, -0.312347412109375, -0.2686614990234375, -0.2249755859375, -0.1812896728515625, -0.137603759765625, -0.0939178466796875, -0.05023193359375, -0.0065460205078125, 0.037139892578125, 0.0808258056640625, 0.12451171875, 0.1681976318359375, 0.211883544921875, 0.2555694580078125, 0.29925537109375, 0.3429412841796875, 0.386627197265625, 0.4303131103515625, 0.4739990234375, 0.5176849365234375, 0.561370849609375, 0.6050567626953125, 0.64874267578125, 0.6924285888671875, 0.736114501953125, 0.7798004150390625, 0.823486328125, 0.8671722412109375, 0.910858154296875, 0.9545440673828125, 0.99822998046875, 1.0419158935546875, 1.085601806640625, 1.1292877197265625, 1.1729736328125, 1.2166595458984375, 1.260345458984375, 1.3040313720703125, 1.34771728515625, 1.3914031982421875, 1.435089111328125, 1.4787750244140625, 1.5224609375]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 2.0, 5.0, 1.0, 2.0, 0.0, 5.0, 5.0, 7.0, 9.0, 12.0, 14.0, 18.0, 20.0, 20.0, 28.0, 28.0, 33.0, 37.0, 36.0, 39.0, 43.0, 45.0, 44.0, 47.0, 45.0, 43.0, 51.0, 45.0, 48.0, 34.0, 22.0, 34.0, 29.0, 21.0, 29.0, 25.0, 11.0, 17.0, 12.0, 10.0, 10.0, 5.0, 5.0, 3.0, 2.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.92578125, -2.828277587890625, -2.73077392578125, -2.633270263671875, -2.5357666015625, -2.438262939453125, -2.34075927734375, -2.243255615234375, -2.145751953125, -2.048248291015625, -1.95074462890625, -1.853240966796875, -1.7557373046875, -1.658233642578125, -1.56072998046875, -1.463226318359375, -1.36572265625, -1.268218994140625, -1.17071533203125, -1.073211669921875, -0.9757080078125, -0.878204345703125, -0.78070068359375, -0.683197021484375, -0.585693359375, -0.488189697265625, -0.39068603515625, -0.293182373046875, -0.1956787109375, -0.098175048828125, -0.00067138671875, 0.096832275390625, 0.1943359375, 0.291839599609375, 0.38934326171875, 0.486846923828125, 0.5843505859375, 0.681854248046875, 0.77935791015625, 0.876861572265625, 0.974365234375, 1.071868896484375, 1.16937255859375, 1.266876220703125, 1.3643798828125, 1.461883544921875, 1.55938720703125, 1.656890869140625, 1.75439453125, 1.851898193359375, 1.94940185546875, 2.046905517578125, 2.1444091796875, 2.241912841796875, 2.33941650390625, 2.436920166015625, 2.534423828125, 2.631927490234375, 2.72943115234375, 2.826934814453125, 2.9244384765625, 3.021942138671875, 3.11944580078125, 3.216949462890625, 3.314453125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 7.0, 18.0, 28.0, 41.0, 40.0, 79.0, 131.0, 227.0, 465.0, 904.0, 2287.0, 6541.0, 26951.0, 201568.0, 704455.0, 83035.0, 14767.0, 4037.0, 1496.0, 678.0, 342.0, 168.0, 111.0, 56.0, 34.0, 22.0, 23.0, 11.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.67626953125, -0.6571121215820312, -0.6379547119140625, -0.6187973022460938, -0.599639892578125, -0.5804824829101562, -0.5613250732421875, -0.5421676635742188, -0.52301025390625, -0.5038528442382812, -0.4846954345703125, -0.46553802490234375, -0.446380615234375, -0.42722320556640625, -0.4080657958984375, -0.38890838623046875, -0.3697509765625, -0.35059356689453125, -0.3314361572265625, -0.31227874755859375, -0.293121337890625, -0.27396392822265625, -0.2548065185546875, -0.23564910888671875, -0.21649169921875, -0.19733428955078125, -0.1781768798828125, -0.15901947021484375, -0.139862060546875, -0.12070465087890625, -0.1015472412109375, -0.08238983154296875, -0.063232421875, -0.04407501220703125, -0.0249176025390625, -0.00576019287109375, 0.013397216796875, 0.03255462646484375, 0.0517120361328125, 0.07086944580078125, 0.09002685546875, 0.10918426513671875, 0.1283416748046875, 0.14749908447265625, 0.166656494140625, 0.18581390380859375, 0.2049713134765625, 0.22412872314453125, 0.2432861328125, 0.26244354248046875, 0.2816009521484375, 0.30075836181640625, 0.319915771484375, 0.33907318115234375, 0.3582305908203125, 0.37738800048828125, 0.39654541015625, 0.41570281982421875, 0.4348602294921875, 0.45401763916015625, 0.473175048828125, 0.49233245849609375, 0.5114898681640625, 0.5306472778320312, 0.5498046875]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 10.0, 4.0, 8.0, 16.0, 16.0, 16.0, 22.0, 43.0, 61.0, 70.0, 108.0, 185.0, 124.0, 85.0, 56.0, 58.0, 25.0, 25.0, 17.0, 18.0, 7.0, 6.0, 6.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.85860824584961e-05, -9.537674486637115e-05, -9.216740727424622e-05, -8.895806968212128e-05, -8.574873208999634e-05, -8.25393944978714e-05, -7.933005690574646e-05, -7.612071931362152e-05, -7.291138172149658e-05, -6.970204412937164e-05, -6.64927065372467e-05, -6.328336894512177e-05, -6.0074031352996826e-05, -5.686469376087189e-05, -5.365535616874695e-05, -5.044601857662201e-05, -4.723668098449707e-05, -4.402734339237213e-05, -4.081800580024719e-05, -3.7608668208122253e-05, -3.4399330615997314e-05, -3.1189993023872375e-05, -2.7980655431747437e-05, -2.4771317839622498e-05, -2.156198024749756e-05, -1.835264265537262e-05, -1.514330506324768e-05, -1.1933967471122742e-05, -8.724629878997803e-06, -5.515292286872864e-06, -2.305954694747925e-06, 9.033828973770142e-07, 4.112720489501953e-06, 7.322058081626892e-06, 1.0531395673751831e-05, 1.374073326587677e-05, 1.695007085800171e-05, 2.0159408450126648e-05, 2.3368746042251587e-05, 2.6578083634376526e-05, 2.9787421226501465e-05, 3.2996758818626404e-05, 3.620609641075134e-05, 3.941543400287628e-05, 4.262477159500122e-05, 4.583410918712616e-05, 4.90434467792511e-05, 5.225278437137604e-05, 5.5462121963500977e-05, 5.8671459555625916e-05, 6.188079714775085e-05, 6.50901347398758e-05, 6.829947233200073e-05, 7.150880992412567e-05, 7.471814751625061e-05, 7.792748510837555e-05, 8.113682270050049e-05, 8.434616029262543e-05, 8.755549788475037e-05, 9.07648354768753e-05, 9.397417306900024e-05, 9.718351066112518e-05, 0.00010039284825325012, 0.00010360218584537506, 0.0001068115234375]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 4.0, 5.0, 4.0, 4.0, 10.0, 16.0, 24.0, 31.0, 43.0, 65.0, 106.0, 158.0, 271.0, 439.0, 881.0, 2043.0, 4717.0, 14346.0, 57948.0, 451630.0, 436531.0, 56821.0, 13943.0, 4611.0, 1875.0, 866.0, 418.0, 259.0, 159.0, 103.0, 66.0, 40.0, 35.0, 21.0, 12.0, 12.0, 6.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50634765625, -0.48888397216796875, -0.4714202880859375, -0.45395660400390625, -0.436492919921875, -0.41902923583984375, -0.4015655517578125, -0.38410186767578125, -0.36663818359375, -0.34917449951171875, -0.3317108154296875, -0.31424713134765625, -0.296783447265625, -0.27931976318359375, -0.2618560791015625, -0.24439239501953125, -0.2269287109375, -0.20946502685546875, -0.1920013427734375, -0.17453765869140625, -0.157073974609375, -0.13961029052734375, -0.1221466064453125, -0.10468292236328125, -0.08721923828125, -0.06975555419921875, -0.0522918701171875, -0.03482818603515625, -0.017364501953125, 9.918212890625e-05, 0.0175628662109375, 0.03502655029296875, 0.052490234375, 0.06995391845703125, 0.0874176025390625, 0.10488128662109375, 0.122344970703125, 0.13980865478515625, 0.1572723388671875, 0.17473602294921875, 0.19219970703125, 0.20966339111328125, 0.2271270751953125, 0.24459075927734375, 0.262054443359375, 0.27951812744140625, 0.2969818115234375, 0.31444549560546875, 0.3319091796875, 0.34937286376953125, 0.3668365478515625, 0.38430023193359375, 0.401763916015625, 0.41922760009765625, 0.4366912841796875, 0.45415496826171875, 0.47161865234375, 0.48908233642578125, 0.5065460205078125, 0.5240097045898438, 0.541473388671875, 0.5589370727539062, 0.5764007568359375, 0.5938644409179688, 0.611328125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 6.0, 9.0, 8.0, 13.0, 17.0, 21.0, 28.0, 30.0, 46.0, 50.0, 70.0, 105.0, 125.0, 125.0, 78.0, 53.0, 50.0, 40.0, 27.0, 26.0, 18.0, 10.0, 8.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.321044921875, -0.3117523193359375, -0.302459716796875, -0.2931671142578125, -0.28387451171875, -0.2745819091796875, -0.265289306640625, -0.2559967041015625, -0.2467041015625, -0.2374114990234375, -0.228118896484375, -0.2188262939453125, -0.20953369140625, -0.2002410888671875, -0.190948486328125, -0.1816558837890625, -0.17236328125, -0.1630706787109375, -0.153778076171875, -0.1444854736328125, -0.13519287109375, -0.1259002685546875, -0.116607666015625, -0.1073150634765625, -0.0980224609375, -0.0887298583984375, -0.079437255859375, -0.0701446533203125, -0.06085205078125, -0.0515594482421875, -0.042266845703125, -0.0329742431640625, -0.023681640625, -0.0143890380859375, -0.005096435546875, 0.0041961669921875, 0.01348876953125, 0.0227813720703125, 0.032073974609375, 0.0413665771484375, 0.0506591796875, 0.0599517822265625, 0.069244384765625, 0.0785369873046875, 0.08782958984375, 0.0971221923828125, 0.106414794921875, 0.1157073974609375, 0.125, 0.1342926025390625, 0.143585205078125, 0.1528778076171875, 0.16217041015625, 0.1714630126953125, 0.180755615234375, 0.1900482177734375, 0.1993408203125, 0.2086334228515625, 0.217926025390625, 0.2272186279296875, 0.23651123046875, 0.2458038330078125, 0.255096435546875, 0.2643890380859375, 0.273681640625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 14.0, 29.0, 120.0, 440.0, 288.0, 67.0, 22.0, 9.0, 11.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.458877563476562, -21.000242233276367, -20.541606903076172, -20.08297348022461, -19.624338150024414, -19.16570281982422, -18.707067489624023, -18.248432159423828, -17.789796829223633, -17.331161499023438, -16.872526168823242, -16.413890838623047, -15.955256462097168, -15.496622085571289, -15.037986755371094, -14.579351425170898, -14.12071704864502, -13.662081718444824, -13.203447341918945, -12.74481201171875, -12.286176681518555, -11.82754135131836, -11.36890697479248, -10.910271644592285, -10.451637268066406, -9.993001937866211, -9.534367561340332, -9.075732231140137, -8.617096900939941, -8.158462524414062, -7.699827194213867, -7.241191864013672, -6.782557010650635, -6.323922157287598, -5.865286827087402, -5.406651973724365, -4.948017120361328, -4.489381790161133, -4.030746936798096, -3.5721118450164795, -3.1134767532348633, -2.654841661453247, -2.196206569671631, -1.7375717163085938, -1.2789366245269775, -0.8203015327453613, -0.3616666793823242, 0.09696841239929199, 0.5556035041809082, 1.0142385959625244, 1.472873568534851, 1.9315085411071777, 2.390143632888794, 2.84877872467041, 3.3074135780334473, 3.7660486698150635, 4.22468376159668, 4.683318614959717, 5.141953945159912, 5.600588798522949, 6.0592241287231445, 6.517858982086182, 6.976493835449219, 7.435129165649414, 7.893764019012451]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 4.0, 8.0, 10.0, 12.0, 14.0, 16.0, 22.0, 28.0, 25.0, 40.0, 41.0, 45.0, 42.0, 46.0, 41.0, 52.0, 51.0, 53.0, 65.0, 45.0, 46.0, 45.0, 39.0, 28.0, 27.0, 21.0, 29.0, 19.0, 13.0, 23.0, 11.0, 10.0, 6.0, 12.0, 3.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-6.503831386566162, -6.293907165527344, -6.083983421325684, -5.874059200286865, -5.664135456085205, -5.454211235046387, -5.244287490844727, -5.034363269805908, -4.824439525604248, -4.61451530456543, -4.4045915603637695, -4.194667339324951, -3.984743595123291, -3.7748193740844727, -3.5648956298828125, -3.354971408843994, -3.145047426223755, -2.9351234436035156, -2.7251994609832764, -2.515275478363037, -2.305351495742798, -2.0954275131225586, -1.8855034112930298, -1.6755794286727905, -1.4656554460525513, -1.255731463432312, -1.0458074808120728, -0.8358834385871887, -0.6259594559669495, -0.41603541374206543, -0.20611143112182617, 0.003812551498413086, 0.21373653411865234, 0.4236605167388916, 0.6335844993591309, 0.8435085415840149, 1.0534324645996094, 1.2633565664291382, 1.4732805490493774, 1.6832045316696167, 1.893128514289856, 2.1030526161193848, 2.312976598739624, 2.5229005813598633, 2.7328245639801025, 2.942748546600342, 3.152672529220581, 3.3625965118408203, 3.5725204944610596, 3.782444477081299, 3.992368459701538, 4.202292442321777, 4.412216663360596, 4.622140407562256, 4.832064628601074, 5.041988372802734, 5.251912593841553, 5.461836814880371, 5.671760559082031, 5.88168478012085, 6.09160852432251, 6.301532745361328, 6.511456489562988, 6.721380710601807, 6.931304454803467]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 6.0, 5.0, 11.0, 10.0, 13.0, 29.0, 44.0, 73.0, 90.0, 162.0, 224.0, 452.0, 822.0, 1627.0, 3331.0, 8360.0, 25694.0, 124619.0, 2858370.0, 1060458.0, 78824.0, 18749.0, 6468.0, 2751.0, 1327.0, 696.0, 398.0, 213.0, 175.0, 90.0, 61.0, 52.0, 30.0, 18.0, 13.0, 5.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9794921875, -1.9084930419921875, -1.837493896484375, -1.7664947509765625, -1.69549560546875, -1.6244964599609375, -1.553497314453125, -1.4824981689453125, -1.4114990234375, -1.3404998779296875, -1.269500732421875, -1.1985015869140625, -1.12750244140625, -1.0565032958984375, -0.985504150390625, -0.9145050048828125, -0.843505859375, -0.7725067138671875, -0.701507568359375, -0.6305084228515625, -0.55950927734375, -0.4885101318359375, -0.417510986328125, -0.3465118408203125, -0.2755126953125, -0.2045135498046875, -0.133514404296875, -0.0625152587890625, 0.00848388671875, 0.0794830322265625, 0.150482177734375, 0.2214813232421875, 0.29248046875, 0.3634796142578125, 0.434478759765625, 0.5054779052734375, 0.57647705078125, 0.6474761962890625, 0.718475341796875, 0.7894744873046875, 0.8604736328125, 0.9314727783203125, 1.002471923828125, 1.0734710693359375, 1.14447021484375, 1.2154693603515625, 1.286468505859375, 1.3574676513671875, 1.428466796875, 1.4994659423828125, 1.570465087890625, 1.6414642333984375, 1.71246337890625, 1.7834625244140625, 1.854461669921875, 1.9254608154296875, 1.9964599609375, 2.0674591064453125, 2.138458251953125, 2.2094573974609375, 2.28045654296875, 2.3514556884765625, 2.422454833984375, 2.4934539794921875, 2.564453125]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 5.0, 1.0, 3.0, 9.0, 4.0, 9.0, 5.0, 13.0, 19.0, 24.0, 37.0, 36.0, 64.0, 78.0, 79.0, 91.0, 85.0, 92.0, 62.0, 65.0, 49.0, 42.0, 34.0, 28.0, 19.0, 10.0, 10.0, 9.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.654296875, -1.593963623046875, -1.53363037109375, -1.473297119140625, -1.4129638671875, -1.352630615234375, -1.29229736328125, -1.231964111328125, -1.171630859375, -1.111297607421875, -1.05096435546875, -0.990631103515625, -0.9302978515625, -0.869964599609375, -0.80963134765625, -0.749298095703125, -0.68896484375, -0.628631591796875, -0.56829833984375, -0.507965087890625, -0.4476318359375, -0.387298583984375, -0.32696533203125, -0.266632080078125, -0.206298828125, -0.145965576171875, -0.08563232421875, -0.025299072265625, 0.0350341796875, 0.095367431640625, 0.15570068359375, 0.216033935546875, 0.2763671875, 0.336700439453125, 0.39703369140625, 0.457366943359375, 0.5177001953125, 0.578033447265625, 0.63836669921875, 0.698699951171875, 0.759033203125, 0.819366455078125, 0.87969970703125, 0.940032958984375, 1.0003662109375, 1.060699462890625, 1.12103271484375, 1.181365966796875, 1.24169921875, 1.302032470703125, 1.36236572265625, 1.422698974609375, 1.4830322265625, 1.543365478515625, 1.60369873046875, 1.664031982421875, 1.724365234375, 1.784698486328125, 1.84503173828125, 1.905364990234375, 1.9656982421875, 2.026031494140625, 2.08636474609375, 2.146697998046875, 2.20703125]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 6.0, 3.0, 9.0, 19.0, 21.0, 27.0, 37.0, 65.0, 85.0, 208.0, 368.0, 819.0, 1960.0, 6276.0, 31812.0, 545448.0, 3519654.0, 71579.0, 10749.0, 2983.0, 1077.0, 467.0, 238.0, 135.0, 89.0, 49.0, 20.0, 23.0, 17.0, 14.0, 11.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.283203125, -3.187164306640625, -3.09112548828125, -2.995086669921875, -2.8990478515625, -2.803009033203125, -2.70697021484375, -2.610931396484375, -2.514892578125, -2.418853759765625, -2.32281494140625, -2.226776123046875, -2.1307373046875, -2.034698486328125, -1.93865966796875, -1.842620849609375, -1.74658203125, -1.650543212890625, -1.55450439453125, -1.458465576171875, -1.3624267578125, -1.266387939453125, -1.17034912109375, -1.074310302734375, -0.978271484375, -0.882232666015625, -0.78619384765625, -0.690155029296875, -0.5941162109375, -0.498077392578125, -0.40203857421875, -0.305999755859375, -0.2099609375, -0.113922119140625, -0.01788330078125, 0.078155517578125, 0.1741943359375, 0.270233154296875, 0.36627197265625, 0.462310791015625, 0.558349609375, 0.654388427734375, 0.75042724609375, 0.846466064453125, 0.9425048828125, 1.038543701171875, 1.13458251953125, 1.230621337890625, 1.32666015625, 1.422698974609375, 1.51873779296875, 1.614776611328125, 1.7108154296875, 1.806854248046875, 1.90289306640625, 1.998931884765625, 2.094970703125, 2.191009521484375, 2.28704833984375, 2.383087158203125, 2.4791259765625, 2.575164794921875, 2.67120361328125, 2.767242431640625, 2.86328125]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 12.0, 7.0, 14.0, 18.0, 36.0, 50.0, 60.0, 88.0, 148.0, 240.0, 557.0, 1312.0, 723.0, 319.0, 167.0, 89.0, 82.0, 52.0, 35.0, 22.0, 12.0, 7.0, 9.0, 1.0, 5.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6787109375, -0.6572799682617188, -0.6358489990234375, -0.6144180297851562, -0.592987060546875, -0.5715560913085938, -0.5501251220703125, -0.5286941528320312, -0.50726318359375, -0.48583221435546875, -0.4644012451171875, -0.44297027587890625, -0.421539306640625, -0.40010833740234375, -0.3786773681640625, -0.35724639892578125, -0.3358154296875, -0.31438446044921875, -0.2929534912109375, -0.27152252197265625, -0.250091552734375, -0.22866058349609375, -0.2072296142578125, -0.18579864501953125, -0.16436767578125, -0.14293670654296875, -0.1215057373046875, -0.10007476806640625, -0.078643798828125, -0.05721282958984375, -0.0357818603515625, -0.01435089111328125, 0.007080078125, 0.02851104736328125, 0.0499420166015625, 0.07137298583984375, 0.092803955078125, 0.11423492431640625, 0.1356658935546875, 0.15709686279296875, 0.17852783203125, 0.19995880126953125, 0.2213897705078125, 0.24282073974609375, 0.264251708984375, 0.28568267822265625, 0.3071136474609375, 0.32854461669921875, 0.3499755859375, 0.37140655517578125, 0.3928375244140625, 0.41426849365234375, 0.435699462890625, 0.45713043212890625, 0.4785614013671875, 0.49999237060546875, 0.52142333984375, 0.5428543090820312, 0.5642852783203125, 0.5857162475585938, 0.607147216796875, 0.6285781860351562, 0.6500091552734375, 0.6714401245117188, 0.69287109375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 6.0, 3.0, 6.0, 8.0, 20.0, 39.0, 82.0, 157.0, 222.0, 194.0, 128.0, 52.0, 22.0, 19.0, 9.0, 16.0, 8.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.906493186950684, -5.765346050262451, -5.624198913574219, -5.483051300048828, -5.341904163360596, -5.200757026672363, -5.059609889984131, -4.918462753295898, -4.777315139770508, -4.636168003082275, -4.495020866394043, -4.353873252868652, -4.21272611618042, -4.0715789794921875, -3.930431842803955, -3.7892847061157227, -3.6481375694274902, -3.506990432739258, -3.3658430576324463, -3.224695920944214, -3.0835485458374023, -2.94240140914917, -2.8012542724609375, -2.660107135772705, -2.5189597606658936, -2.377812623977661, -2.2366652488708496, -2.095518112182617, -1.9543708562850952, -1.8132236003875732, -1.6720764636993408, -1.5309292078018188, -1.3897817134857178, -1.2486344575881958, -1.1074872016906738, -0.9663400650024414, -0.8251928091049194, -0.6840455532073975, -0.5428983569145203, -0.40175116062164307, -0.2606039047241211, -0.11945667862892151, 0.021690547466278076, 0.16283777356147766, 0.30398499965667725, 0.4451322555541992, 0.5862794518470764, 0.7274266481399536, 0.8685739040374756, 1.0097211599349976, 1.1508684158325195, 1.292015552520752, 1.433162808418274, 1.574310064315796, 1.7154572010040283, 1.8566044569015503, 1.9977517127990723, 2.1388988494873047, 2.280046224594116, 2.4211933612823486, 2.56234073638916, 2.7034878730773926, 2.844635009765625, 2.9857821464538574, 3.126929521560669]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 2.0, 2.0, 7.0, 5.0, 6.0, 11.0, 11.0, 14.0, 16.0, 28.0, 31.0, 41.0, 25.0, 55.0, 47.0, 56.0, 72.0, 71.0, 61.0, 66.0, 65.0, 60.0, 37.0, 36.0, 36.0, 34.0, 26.0, 20.0, 10.0, 9.0, 7.0, 14.0, 9.0, 4.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5737828016281128, -1.5160099267959595, -1.4582370519638062, -1.4004642963409424, -1.342691421508789, -1.2849185466766357, -1.2271456718444824, -1.169372797012329, -1.1115999221801758, -1.0538270473480225, -0.9960542321205139, -0.9382813572883606, -0.880508542060852, -0.8227356672286987, -0.7649627923965454, -0.7071899175643921, -0.6494171619415283, -0.591644287109375, -0.5338714718818665, -0.47609859704971313, -0.4183257520198822, -0.36055290699005127, -0.30278003215789795, -0.24500718712806702, -0.18723434209823608, -0.12946149706840515, -0.07168863713741302, -0.013915777206420898, 0.043857067823410034, 0.10162991285324097, 0.1594027876853943, 0.21717563271522522, 0.2749483585357666, 0.33272120356559753, 0.39049404859542847, 0.4482669234275818, 0.5060397386550903, 0.5638126134872437, 0.621585488319397, 0.6793583631515503, 0.7371311783790588, 0.7949040532112122, 0.8526768684387207, 0.910449743270874, 0.9682226181030273, 1.0259954929351807, 1.083768367767334, 1.1415411233901978, 1.199313998222351, 1.2570868730545044, 1.3148597478866577, 1.3726325035095215, 1.4304053783416748, 1.4881782531738281, 1.5459511280059814, 1.6037240028381348, 1.661496877670288, 1.7192697525024414, 1.7770426273345947, 1.834815502166748, 1.8925882577896118, 1.9503611326217651, 2.008133888244629, 2.0659067630767822, 2.1236796379089355]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 5.0, 3.0, 9.0, 8.0, 9.0, 17.0, 31.0, 40.0, 60.0, 83.0, 141.0, 273.0, 549.0, 1084.0, 2783.0, 8830.0, 39571.0, 414183.0, 518576.0, 46940.0, 9861.0, 3021.0, 1186.0, 560.0, 301.0, 157.0, 94.0, 65.0, 40.0, 21.0, 20.0, 12.0, 7.0, 6.0, 7.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.238037109375, -0.2312450408935547, -0.22445297241210938, -0.21766090393066406, -0.21086883544921875, -0.20407676696777344, -0.19728469848632812, -0.1904926300048828, -0.1837005615234375, -0.1769084930419922, -0.17011642456054688, -0.16332435607910156, -0.15653228759765625, -0.14974021911621094, -0.14294815063476562, -0.1361560821533203, -0.129364013671875, -0.12257194519042969, -0.11577987670898438, -0.10898780822753906, -0.10219573974609375, -0.09540367126464844, -0.08861160278320312, -0.08181953430175781, -0.0750274658203125, -0.06823539733886719, -0.061443328857421875, -0.05465126037597656, -0.04785919189453125, -0.04106712341308594, -0.034275054931640625, -0.027482986450195312, -0.02069091796875, -0.013898849487304688, -0.007106781005859375, -0.0003147125244140625, 0.00647735595703125, 0.013269424438476562, 0.020061492919921875, 0.026853561401367188, 0.0336456298828125, 0.04043769836425781, 0.047229766845703125, 0.05402183532714844, 0.06081390380859375, 0.06760597229003906, 0.07439804077148438, 0.08119010925292969, 0.087982177734375, 0.09477424621582031, 0.10156631469726562, 0.10835838317871094, 0.11515045166015625, 0.12194252014160156, 0.12873458862304688, 0.1355266571044922, 0.1423187255859375, 0.1491107940673828, 0.15590286254882812, 0.16269493103027344, 0.16948699951171875, 0.17627906799316406, 0.18307113647460938, 0.1898632049560547, 0.1966552734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 4.0, 1.0, 7.0, 5.0, 9.0, 4.0, 8.0, 7.0, 16.0, 17.0, 21.0, 28.0, 57.0, 60.0, 72.0, 75.0, 84.0, 89.0, 89.0, 74.0, 62.0, 49.0, 49.0, 35.0, 18.0, 14.0, 15.0, 15.0, 8.0, 8.0, 1.0, 5.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4140625, -1.3656158447265625, -1.317169189453125, -1.2687225341796875, -1.22027587890625, -1.1718292236328125, -1.123382568359375, -1.0749359130859375, -1.0264892578125, -0.9780426025390625, -0.929595947265625, -0.8811492919921875, -0.83270263671875, -0.7842559814453125, -0.735809326171875, -0.6873626708984375, -0.638916015625, -0.5904693603515625, -0.542022705078125, -0.4935760498046875, -0.44512939453125, -0.3966827392578125, -0.348236083984375, -0.2997894287109375, -0.2513427734375, -0.2028961181640625, -0.154449462890625, -0.1060028076171875, -0.05755615234375, -0.0091094970703125, 0.039337158203125, 0.0877838134765625, 0.13623046875, 0.1846771240234375, 0.233123779296875, 0.2815704345703125, 0.33001708984375, 0.3784637451171875, 0.426910400390625, 0.4753570556640625, 0.5238037109375, 0.5722503662109375, 0.620697021484375, 0.6691436767578125, 0.71759033203125, 0.7660369873046875, 0.814483642578125, 0.8629302978515625, 0.911376953125, 0.9598236083984375, 1.008270263671875, 1.0567169189453125, 1.10516357421875, 1.1536102294921875, 1.202056884765625, 1.2505035400390625, 1.2989501953125, 1.3473968505859375, 1.395843505859375, 1.4442901611328125, 1.49273681640625, 1.5411834716796875, 1.589630126953125, 1.6380767822265625, 1.6865234375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 7.0, 5.0, 9.0, 13.0, 5.0, 15.0, 14.0, 16.0, 20.0, 33.0, 48.0, 51.0, 61.0, 85.0, 112.0, 149.0, 221.0, 330.0, 597.0, 1674.0, 7520.0, 62003.0, 665243.0, 282469.0, 22150.0, 3363.0, 932.0, 373.0, 244.0, 179.0, 137.0, 113.0, 76.0, 69.0, 54.0, 36.0, 28.0, 29.0, 20.0, 12.0, 7.0, 8.0, 5.0, 7.0, 4.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.181884765625, -0.1761646270751953, -0.17044448852539062, -0.16472434997558594, -0.15900421142578125, -0.15328407287597656, -0.14756393432617188, -0.1418437957763672, -0.1361236572265625, -0.1304035186767578, -0.12468338012695312, -0.11896324157714844, -0.11324310302734375, -0.10752296447753906, -0.10180282592773438, -0.09608268737792969, -0.090362548828125, -0.08464241027832031, -0.07892227172851562, -0.07320213317871094, -0.06748199462890625, -0.06176185607910156, -0.056041717529296875, -0.05032157897949219, -0.0446014404296875, -0.03888130187988281, -0.033161163330078125, -0.027441024780273438, -0.02172088623046875, -0.016000747680664062, -0.010280609130859375, -0.0045604705810546875, 0.00115966796875, 0.0068798065185546875, 0.012599945068359375, 0.018320083618164062, 0.02404022216796875, 0.029760360717773438, 0.035480499267578125, 0.04120063781738281, 0.0469207763671875, 0.05264091491699219, 0.058361053466796875, 0.06408119201660156, 0.06980133056640625, 0.07552146911621094, 0.08124160766601562, 0.08696174621582031, 0.092681884765625, 0.09840202331542969, 0.10412216186523438, 0.10984230041503906, 0.11556243896484375, 0.12128257751464844, 0.12700271606445312, 0.1327228546142578, 0.1384429931640625, 0.1441631317138672, 0.14988327026367188, 0.15560340881347656, 0.16132354736328125, 0.16704368591308594, 0.17276382446289062, 0.1784839630126953, 0.1842041015625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 2.0, 1.0, 4.0, 1.0, 7.0, 9.0, 7.0, 10.0, 12.0, 26.0, 25.0, 21.0, 35.0, 26.0, 35.0, 32.0, 55.0, 48.0, 66.0, 60.0, 52.0, 58.0, 53.0, 48.0, 50.0, 35.0, 28.0, 36.0, 39.0, 25.0, 21.0, 16.0, 14.0, 12.0, 8.0, 9.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.111328125, -2.0447998046875, -1.978271484375, -1.9117431640625, -1.84521484375, -1.7786865234375, -1.712158203125, -1.6456298828125, -1.5791015625, -1.5125732421875, -1.446044921875, -1.3795166015625, -1.31298828125, -1.2464599609375, -1.179931640625, -1.1134033203125, -1.046875, -0.9803466796875, -0.913818359375, -0.8472900390625, -0.78076171875, -0.7142333984375, -0.647705078125, -0.5811767578125, -0.5146484375, -0.4481201171875, -0.381591796875, -0.3150634765625, -0.24853515625, -0.1820068359375, -0.115478515625, -0.0489501953125, 0.017578125, 0.0841064453125, 0.150634765625, 0.2171630859375, 0.28369140625, 0.3502197265625, 0.416748046875, 0.4832763671875, 0.5498046875, 0.6163330078125, 0.682861328125, 0.7493896484375, 0.81591796875, 0.8824462890625, 0.948974609375, 1.0155029296875, 1.08203125, 1.1485595703125, 1.215087890625, 1.2816162109375, 1.34814453125, 1.4146728515625, 1.481201171875, 1.5477294921875, 1.6142578125, 1.6807861328125, 1.747314453125, 1.8138427734375, 1.88037109375, 1.9468994140625, 2.013427734375, 2.0799560546875, 2.146484375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 2.0, 3.0, 4.0, 3.0, 8.0, 7.0, 9.0, 13.0, 10.0, 20.0, 31.0, 43.0, 56.0, 114.0, 141.0, 277.0, 673.0, 3034.0, 64465.0, 969343.0, 7981.0, 1325.0, 419.0, 192.0, 106.0, 77.0, 61.0, 38.0, 18.0, 13.0, 12.0, 8.0, 8.0, 8.0, 7.0, 4.0, 5.0, 2.0, 1.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.06475830078125, -0.06297063827514648, -0.06118297576904297, -0.05939531326293945, -0.05760765075683594, -0.05581998825073242, -0.054032325744628906, -0.05224466323852539, -0.050457000732421875, -0.04866933822631836, -0.046881675720214844, -0.04509401321411133, -0.04330635070800781, -0.0415186882019043, -0.03973102569580078, -0.037943363189697266, -0.03615570068359375, -0.034368038177490234, -0.03258037567138672, -0.030792713165283203, -0.029005050659179688, -0.027217388153076172, -0.025429725646972656, -0.02364206314086914, -0.021854400634765625, -0.02006673812866211, -0.018279075622558594, -0.016491413116455078, -0.014703750610351562, -0.012916088104248047, -0.011128425598144531, -0.009340763092041016, -0.0075531005859375, -0.005765438079833984, -0.003977775573730469, -0.002190113067626953, -0.0004024505615234375, 0.0013852119445800781, 0.0031728744506835938, 0.004960536956787109, 0.006748199462890625, 0.00853586196899414, 0.010323524475097656, 0.012111186981201172, 0.013898849487304688, 0.015686511993408203, 0.01747417449951172, 0.019261837005615234, 0.02104949951171875, 0.022837162017822266, 0.02462482452392578, 0.026412487030029297, 0.028200149536132812, 0.029987812042236328, 0.031775474548339844, 0.03356313705444336, 0.035350799560546875, 0.03713846206665039, 0.038926124572753906, 0.04071378707885742, 0.04250144958496094, 0.04428911209106445, 0.04607677459716797, 0.047864437103271484, 0.049652099609375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 6.0, 7.0, 9.0, 6.0, 16.0, 18.0, 34.0, 35.0, 58.0, 91.0, 105.0, 147.0, 143.0, 96.0, 80.0, 41.0, 31.0, 19.0, 12.0, 10.0, 7.0, 8.0, 5.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.1457672119140625e-05, -2.0944513380527496e-05, -2.0431354641914368e-05, -1.991819590330124e-05, -1.940503716468811e-05, -1.889187842607498e-05, -1.8378719687461853e-05, -1.7865560948848724e-05, -1.7352402210235596e-05, -1.6839243471622467e-05, -1.632608473300934e-05, -1.581292599439621e-05, -1.529976725578308e-05, -1.4786608517169952e-05, -1.4273449778556824e-05, -1.3760291039943695e-05, -1.3247132301330566e-05, -1.2733973562717438e-05, -1.2220814824104309e-05, -1.170765608549118e-05, -1.1194497346878052e-05, -1.0681338608264923e-05, -1.0168179869651794e-05, -9.655021131038666e-06, -9.141862392425537e-06, -8.628703653812408e-06, -8.11554491519928e-06, -7.602386176586151e-06, -7.0892274379730225e-06, -6.576068699359894e-06, -6.062909960746765e-06, -5.5497512221336365e-06, -5.036592483520508e-06, -4.523433744907379e-06, -4.0102750062942505e-06, -3.497116267681122e-06, -2.983957529067993e-06, -2.4707987904548645e-06, -1.957640051841736e-06, -1.4444813132286072e-06, -9.313225746154785e-07, -4.1816383600234985e-07, 9.499490261077881e-08, 6.081536412239075e-07, 1.1213123798370361e-06, 1.6344711184501648e-06, 2.1476298570632935e-06, 2.660788595676422e-06, 3.1739473342895508e-06, 3.6871060729026794e-06, 4.200264811515808e-06, 4.713423550128937e-06, 5.2265822887420654e-06, 5.739741027355194e-06, 6.252899765968323e-06, 6.766058504581451e-06, 7.27921724319458e-06, 7.792375981807709e-06, 8.305534720420837e-06, 8.818693459033966e-06, 9.331852197647095e-06, 9.845010936260223e-06, 1.0358169674873352e-05, 1.087132841348648e-05, 1.138448715209961e-05]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 0.0, 3.0, 4.0, 4.0, 12.0, 14.0, 24.0, 25.0, 32.0, 42.0, 76.0, 114.0, 154.0, 260.0, 427.0, 731.0, 1400.0, 2876.0, 7760.0, 30621.0, 591459.0, 372794.0, 26651.0, 7158.0, 2825.0, 1336.0, 669.0, 399.0, 217.0, 154.0, 95.0, 65.0, 44.0, 29.0, 16.0, 12.0, 16.0, 9.0, 10.0, 5.0, 2.0, 3.0, 4.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042816162109375, -0.04147624969482422, -0.04013633728027344, -0.038796424865722656, -0.037456512451171875, -0.036116600036621094, -0.03477668762207031, -0.03343677520751953, -0.03209686279296875, -0.03075695037841797, -0.029417037963867188, -0.028077125549316406, -0.026737213134765625, -0.025397300720214844, -0.024057388305664062, -0.02271747589111328, -0.0213775634765625, -0.02003765106201172, -0.018697738647460938, -0.017357826232910156, -0.016017913818359375, -0.014678001403808594, -0.013338088989257812, -0.011998176574707031, -0.01065826416015625, -0.009318351745605469, -0.007978439331054688, -0.006638526916503906, -0.005298614501953125, -0.003958702087402344, -0.0026187896728515625, -0.0012788772583007812, 6.103515625e-05, 0.0014009475708007812, 0.0027408599853515625, 0.004080772399902344, 0.005420684814453125, 0.006760597229003906, 0.008100509643554688, 0.009440422058105469, 0.01078033447265625, 0.012120246887207031, 0.013460159301757812, 0.014800071716308594, 0.016139984130859375, 0.017479896545410156, 0.018819808959960938, 0.02015972137451172, 0.0214996337890625, 0.02283954620361328, 0.024179458618164062, 0.025519371032714844, 0.026859283447265625, 0.028199195861816406, 0.029539108276367188, 0.03087902069091797, 0.03221893310546875, 0.03355884552001953, 0.03489875793457031, 0.036238670349121094, 0.037578582763671875, 0.038918495178222656, 0.04025840759277344, 0.04159832000732422, 0.042938232421875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 11.0, 13.0, 14.0, 42.0, 51.0, 89.0, 203.0, 285.0, 79.0, 41.0, 37.0, 28.0, 22.0, 17.0, 6.0, 8.0, 7.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01181793212890625, -0.011461019515991211, -0.011104106903076172, -0.010747194290161133, -0.010390281677246094, -0.010033369064331055, -0.009676456451416016, -0.009319543838500977, -0.008962631225585938, -0.008605718612670898, -0.00824880599975586, -0.00789189338684082, -0.007534980773925781, -0.007178068161010742, -0.006821155548095703, -0.006464242935180664, -0.006107330322265625, -0.005750417709350586, -0.005393505096435547, -0.005036592483520508, -0.004679679870605469, -0.00432276725769043, -0.003965854644775391, -0.0036089420318603516, -0.0032520294189453125, -0.0028951168060302734, -0.0025382041931152344, -0.0021812915802001953, -0.0018243789672851562, -0.0014674663543701172, -0.0011105537414550781, -0.0007536411285400391, -0.000396728515625, -3.981590270996094e-05, 0.0003170967102050781, 0.0006740093231201172, 0.0010309219360351562, 0.0013878345489501953, 0.0017447471618652344, 0.0021016597747802734, 0.0024585723876953125, 0.0028154850006103516, 0.0031723976135253906, 0.0035293102264404297, 0.0038862228393554688, 0.004243135452270508, 0.004600048065185547, 0.004956960678100586, 0.005313873291015625, 0.005670785903930664, 0.006027698516845703, 0.006384611129760742, 0.006741523742675781, 0.00709843635559082, 0.007455348968505859, 0.0078122615814208984, 0.008169174194335938, 0.008526086807250977, 0.008882999420166016, 0.009239912033081055, 0.009596824645996094, 0.009953737258911133, 0.010310649871826172, 0.010667562484741211, 0.01102447509765625]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 5.0, 8.0, 26.0, 39.0, 110.0, 270.0, 283.0, 144.0, 45.0, 21.0, 14.0, 11.0, 13.0, 7.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.824275493621826, -4.7041215896606445, -4.583967685699463, -4.463813781738281, -4.343660354614258, -4.223506450653076, -4.1033525466918945, -3.983198642730713, -3.8630449771881104, -3.7428910732269287, -3.622737407684326, -3.5025835037231445, -3.382429599761963, -3.2622759342193604, -3.1421220302581787, -3.021968364715576, -2.9018144607543945, -2.781660556793213, -2.6615068912506104, -2.5413529872894287, -2.421199083328247, -2.3010454177856445, -2.180891513824463, -2.0607376098632812, -1.9405837059020996, -1.8204299211502075, -1.7002760171890259, -1.5801222324371338, -1.4599684476852417, -1.3398146629333496, -1.219660758972168, -1.0995069742202759, -0.9793531894683838, -0.8591993451118469, -0.7390455603599548, -0.618891716003418, -0.4987379014492035, -0.378584086894989, -0.25843024253845215, -0.13827645778656006, -0.018122613430023193, 0.10203120857477188, 0.22218503057956696, 0.3423388600349426, 0.4624926745891571, 0.5826464891433716, 0.7028003334999084, 0.8229541182518005, 0.9431079626083374, 1.0632617473602295, 1.1834156513214111, 1.3035694360733032, 1.4237232208251953, 1.543877124786377, 1.664030909538269, 1.7841846942901611, 1.9043385982513428, 2.0244925022125244, 2.144646167755127, 2.2648000717163086, 2.3849539756774902, 2.5051076412200928, 2.6252615451812744, 2.745415210723877, 2.8655691146850586]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 5.0, 4.0, 2.0, 5.0, 11.0, 7.0, 11.0, 16.0, 19.0, 29.0, 34.0, 51.0, 63.0, 58.0, 96.0, 96.0, 83.0, 86.0, 88.0, 43.0, 51.0, 41.0, 26.0, 20.0, 15.0, 10.0, 12.0, 10.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3058565855026245, -1.257638931274414, -1.2094212770462036, -1.1612036228179932, -1.1129859685897827, -1.0647683143615723, -1.0165506601333618, -0.9683330059051514, -0.9201153516769409, -0.8718976974487305, -0.82368004322052, -0.7754623889923096, -0.7272447347640991, -0.6790270805358887, -0.6308094263076782, -0.5825917720794678, -0.5343741774559021, -0.48615652322769165, -0.4379388689994812, -0.38972121477127075, -0.3415035605430603, -0.29328590631484985, -0.2450682818889618, -0.19685062766075134, -0.1486329734325409, -0.10041531920433044, -0.05219767242670059, -0.00398002564907074, 0.04423762857913971, 0.09245528280735016, 0.14067292213439941, 0.18889057636260986, 0.2371082305908203, 0.28532588481903076, 0.3335435390472412, 0.38176119327545166, 0.4299788475036621, 0.47819650173187256, 0.526414155960083, 0.5746318101882935, 0.6228494644165039, 0.6710671186447144, 0.7192847728729248, 0.7675024271011353, 0.8157200813293457, 0.8639377355575562, 0.9121553897857666, 0.960373044013977, 1.0085906982421875, 1.056808352470398, 1.1050260066986084, 1.1532436609268188, 1.2014613151550293, 1.2496789693832397, 1.2978966236114502, 1.3461142778396606, 1.3943318128585815, 1.442549467086792, 1.4907671213150024, 1.538984775543213, 1.5872024297714233, 1.6354200839996338, 1.6836377382278442, 1.7318553924560547, 1.7800730466842651]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 8.0, 9.0, 16.0, 24.0, 39.0, 69.0, 106.0, 188.0, 318.0, 599.0, 1199.0, 2651.0, 6377.0, 17603.0, 61695.0, 296721.0, 510820.0, 105893.0, 27850.0, 9357.0, 3714.0, 1607.0, 724.0, 366.0, 220.0, 132.0, 83.0, 62.0, 26.0, 22.0, 16.0, 12.0, 9.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.04296875, -1.0084228515625, -0.973876953125, -0.9393310546875, -0.90478515625, -0.8702392578125, -0.835693359375, -0.8011474609375, -0.7666015625, -0.7320556640625, -0.697509765625, -0.6629638671875, -0.62841796875, -0.5938720703125, -0.559326171875, -0.5247802734375, -0.490234375, -0.4556884765625, -0.421142578125, -0.3865966796875, -0.35205078125, -0.3175048828125, -0.282958984375, -0.2484130859375, -0.2138671875, -0.1793212890625, -0.144775390625, -0.1102294921875, -0.07568359375, -0.0411376953125, -0.006591796875, 0.0279541015625, 0.0625, 0.0970458984375, 0.131591796875, 0.1661376953125, 0.20068359375, 0.2352294921875, 0.269775390625, 0.3043212890625, 0.3388671875, 0.3734130859375, 0.407958984375, 0.4425048828125, 0.47705078125, 0.5115966796875, 0.546142578125, 0.5806884765625, 0.615234375, 0.6497802734375, 0.684326171875, 0.7188720703125, 0.75341796875, 0.7879638671875, 0.822509765625, 0.8570556640625, 0.8916015625, 0.9261474609375, 0.960693359375, 0.9952392578125, 1.02978515625, 1.0643310546875, 1.098876953125, 1.1334228515625, 1.16796875]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 9.0, 6.0, 6.0, 12.0, 13.0, 18.0, 21.0, 28.0, 36.0, 59.0, 63.0, 64.0, 85.0, 89.0, 90.0, 86.0, 75.0, 56.0, 46.0, 37.0, 23.0, 23.0, 11.0, 13.0, 6.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.625, -3.5108642578125, -3.396728515625, -3.2825927734375, -3.16845703125, -3.0543212890625, -2.940185546875, -2.8260498046875, -2.7119140625, -2.5977783203125, -2.483642578125, -2.3695068359375, -2.25537109375, -2.1412353515625, -2.027099609375, -1.9129638671875, -1.798828125, -1.6846923828125, -1.570556640625, -1.4564208984375, -1.34228515625, -1.2281494140625, -1.114013671875, -0.9998779296875, -0.8857421875, -0.7716064453125, -0.657470703125, -0.5433349609375, -0.42919921875, -0.3150634765625, -0.200927734375, -0.0867919921875, 0.02734375, 0.1414794921875, 0.255615234375, 0.3697509765625, 0.48388671875, 0.5980224609375, 0.712158203125, 0.8262939453125, 0.9404296875, 1.0545654296875, 1.168701171875, 1.2828369140625, 1.39697265625, 1.5111083984375, 1.625244140625, 1.7393798828125, 1.853515625, 1.9676513671875, 2.081787109375, 2.1959228515625, 2.31005859375, 2.4241943359375, 2.538330078125, 2.6524658203125, 2.7666015625, 2.8807373046875, 2.994873046875, 3.1090087890625, 3.22314453125, 3.3372802734375, 3.451416015625, 3.5655517578125, 3.6796875]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 3.0, 3.0, 4.0, 6.0, 13.0, 8.0, 6.0, 19.0, 17.0, 25.0, 24.0, 44.0, 39.0, 53.0, 83.0, 95.0, 136.0, 244.0, 347.0, 568.0, 1141.0, 2449.0, 6245.0, 18610.0, 70094.0, 351824.0, 467346.0, 91978.0, 23400.0, 7518.0, 2986.0, 1358.0, 666.0, 360.0, 226.0, 190.0, 111.0, 76.0, 62.0, 38.0, 32.0, 33.0, 18.0, 15.0, 11.0, 6.0, 10.0, 5.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.8115234375, -0.7862396240234375, -0.760955810546875, -0.7356719970703125, -0.71038818359375, -0.6851043701171875, -0.659820556640625, -0.6345367431640625, -0.6092529296875, -0.5839691162109375, -0.558685302734375, -0.5334014892578125, -0.50811767578125, -0.4828338623046875, -0.457550048828125, -0.4322662353515625, -0.406982421875, -0.3816986083984375, -0.356414794921875, -0.3311309814453125, -0.30584716796875, -0.2805633544921875, -0.255279541015625, -0.2299957275390625, -0.2047119140625, -0.1794281005859375, -0.154144287109375, -0.1288604736328125, -0.10357666015625, -0.0782928466796875, -0.053009033203125, -0.0277252197265625, -0.00244140625, 0.0228424072265625, 0.048126220703125, 0.0734100341796875, 0.09869384765625, 0.1239776611328125, 0.149261474609375, 0.1745452880859375, 0.1998291015625, 0.2251129150390625, 0.250396728515625, 0.2756805419921875, 0.30096435546875, 0.3262481689453125, 0.351531982421875, 0.3768157958984375, 0.402099609375, 0.4273834228515625, 0.452667236328125, 0.4779510498046875, 0.50323486328125, 0.5285186767578125, 0.553802490234375, 0.5790863037109375, 0.6043701171875, 0.6296539306640625, 0.654937744140625, 0.6802215576171875, 0.70550537109375, 0.7307891845703125, 0.756072998046875, 0.7813568115234375, 0.806640625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 11.0, 3.0, 6.0, 11.0, 15.0, 13.0, 12.0, 17.0, 18.0, 22.0, 16.0, 24.0, 24.0, 28.0, 43.0, 37.0, 42.0, 40.0, 32.0, 36.0, 30.0, 47.0, 44.0, 39.0, 50.0, 28.0, 34.0, 30.0, 37.0, 26.0, 33.0, 28.0, 23.0, 17.0, 23.0, 14.0, 11.0, 8.0, 6.0, 7.0, 8.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.90625, -2.821929931640625, -2.73760986328125, -2.653289794921875, -2.5689697265625, -2.484649658203125, -2.40032958984375, -2.316009521484375, -2.231689453125, -2.147369384765625, -2.06304931640625, -1.978729248046875, -1.8944091796875, -1.810089111328125, -1.72576904296875, -1.641448974609375, -1.55712890625, -1.472808837890625, -1.38848876953125, -1.304168701171875, -1.2198486328125, -1.135528564453125, -1.05120849609375, -0.966888427734375, -0.882568359375, -0.798248291015625, -0.71392822265625, -0.629608154296875, -0.5452880859375, -0.460968017578125, -0.37664794921875, -0.292327880859375, -0.2080078125, -0.123687744140625, -0.03936767578125, 0.044952392578125, 0.1292724609375, 0.213592529296875, 0.29791259765625, 0.382232666015625, 0.466552734375, 0.550872802734375, 0.63519287109375, 0.719512939453125, 0.8038330078125, 0.888153076171875, 0.97247314453125, 1.056793212890625, 1.14111328125, 1.225433349609375, 1.30975341796875, 1.394073486328125, 1.4783935546875, 1.562713623046875, 1.64703369140625, 1.731353759765625, 1.815673828125, 1.899993896484375, 1.98431396484375, 2.068634033203125, 2.1529541015625, 2.237274169921875, 2.32159423828125, 2.405914306640625, 2.490234375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 4.0, 7.0, 10.0, 16.0, 13.0, 30.0, 45.0, 46.0, 93.0, 156.0, 236.0, 428.0, 870.0, 1929.0, 5701.0, 26337.0, 266525.0, 676702.0, 54447.0, 9577.0, 2864.0, 1118.0, 586.0, 324.0, 158.0, 93.0, 74.0, 40.0, 33.0, 16.0, 13.0, 10.0, 9.0, 11.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.5947265625, -0.5768051147460938, -0.5588836669921875, -0.5409622192382812, -0.523040771484375, -0.5051193237304688, -0.4871978759765625, -0.46927642822265625, -0.45135498046875, -0.43343353271484375, -0.4155120849609375, -0.39759063720703125, -0.379669189453125, -0.36174774169921875, -0.3438262939453125, -0.32590484619140625, -0.3079833984375, -0.29006195068359375, -0.2721405029296875, -0.25421905517578125, -0.236297607421875, -0.21837615966796875, -0.2004547119140625, -0.18253326416015625, -0.16461181640625, -0.14669036865234375, -0.1287689208984375, -0.11084747314453125, -0.092926025390625, -0.07500457763671875, -0.0570831298828125, -0.03916168212890625, -0.021240234375, -0.00331878662109375, 0.0146026611328125, 0.03252410888671875, 0.050445556640625, 0.06836700439453125, 0.0862884521484375, 0.10420989990234375, 0.12213134765625, 0.14005279541015625, 0.1579742431640625, 0.17589569091796875, 0.193817138671875, 0.21173858642578125, 0.2296600341796875, 0.24758148193359375, 0.2655029296875, 0.28342437744140625, 0.3013458251953125, 0.31926727294921875, 0.337188720703125, 0.35511016845703125, 0.3730316162109375, 0.39095306396484375, 0.40887451171875, 0.42679595947265625, 0.4447174072265625, 0.46263885498046875, 0.480560302734375, 0.49848175048828125, 0.5164031982421875, 0.5343246459960938, 0.55224609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 3.0, 6.0, 7.0, 4.0, 3.0, 12.0, 12.0, 14.0, 24.0, 29.0, 39.0, 54.0, 87.0, 127.0, 130.0, 139.0, 101.0, 53.0, 44.0, 31.0, 16.0, 14.0, 15.0, 13.0, 5.0, 10.0, 5.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.930133819580078e-05, -9.665079414844513e-05, -9.400025010108948e-05, -9.134970605373383e-05, -8.869916200637817e-05, -8.604861795902252e-05, -8.339807391166687e-05, -8.074752986431122e-05, -7.809698581695557e-05, -7.544644176959991e-05, -7.279589772224426e-05, -7.014535367488861e-05, -6.749480962753296e-05, -6.484426558017731e-05, -6.219372153282166e-05, -5.9543177485466003e-05, -5.689263343811035e-05, -5.42420893907547e-05, -5.159154534339905e-05, -4.8941001296043396e-05, -4.6290457248687744e-05, -4.363991320133209e-05, -4.098936915397644e-05, -3.833882510662079e-05, -3.568828105926514e-05, -3.3037737011909485e-05, -3.0387192964553833e-05, -2.773664891719818e-05, -2.508610486984253e-05, -2.2435560822486877e-05, -1.9785016775131226e-05, -1.7134472727775574e-05, -1.4483928680419922e-05, -1.183338463306427e-05, -9.182840585708618e-06, -6.532296538352966e-06, -3.8817524909973145e-06, -1.2312084436416626e-06, 1.4193356037139893e-06, 4.069879651069641e-06, 6.720423698425293e-06, 9.370967745780945e-06, 1.2021511793136597e-05, 1.4672055840492249e-05, 1.73225998878479e-05, 1.9973143935203552e-05, 2.2623687982559204e-05, 2.5274232029914856e-05, 2.7924776077270508e-05, 3.057532012462616e-05, 3.322586417198181e-05, 3.587640821933746e-05, 3.8526952266693115e-05, 4.117749631404877e-05, 4.382804036140442e-05, 4.647858440876007e-05, 4.912912845611572e-05, 5.1779672503471375e-05, 5.4430216550827026e-05, 5.708076059818268e-05, 5.973130464553833e-05, 6.238184869289398e-05, 6.503239274024963e-05, 6.768293678760529e-05, 7.033348083496094e-05]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 0.0, 1.0, 4.0, 5.0, 4.0, 4.0, 6.0, 7.0, 6.0, 17.0, 22.0, 41.0, 63.0, 125.0, 245.0, 482.0, 1085.0, 2676.0, 9215.0, 55644.0, 738051.0, 211016.0, 21712.0, 4970.0, 1691.0, 675.0, 362.0, 177.0, 90.0, 53.0, 29.0, 19.0, 11.0, 13.0, 3.0, 9.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6298828125, -0.6087188720703125, -0.587554931640625, -0.5663909912109375, -0.54522705078125, -0.5240631103515625, -0.502899169921875, -0.4817352294921875, -0.4605712890625, -0.4394073486328125, -0.418243408203125, -0.3970794677734375, -0.37591552734375, -0.3547515869140625, -0.333587646484375, -0.3124237060546875, -0.291259765625, -0.2700958251953125, -0.248931884765625, -0.2277679443359375, -0.20660400390625, -0.1854400634765625, -0.164276123046875, -0.1431121826171875, -0.1219482421875, -0.1007843017578125, -0.079620361328125, -0.0584564208984375, -0.03729248046875, -0.0161285400390625, 0.005035400390625, 0.0261993408203125, 0.04736328125, 0.0685272216796875, 0.089691162109375, 0.1108551025390625, 0.13201904296875, 0.1531829833984375, 0.174346923828125, 0.1955108642578125, 0.2166748046875, 0.2378387451171875, 0.259002685546875, 0.2801666259765625, 0.30133056640625, 0.3224945068359375, 0.343658447265625, 0.3648223876953125, 0.385986328125, 0.4071502685546875, 0.428314208984375, 0.4494781494140625, 0.47064208984375, 0.4918060302734375, 0.512969970703125, 0.5341339111328125, 0.5552978515625, 0.5764617919921875, 0.597625732421875, 0.6187896728515625, 0.63995361328125, 0.6611175537109375, 0.682281494140625, 0.7034454345703125, 0.724609375]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 13.0, 8.0, 17.0, 22.0, 45.0, 51.0, 96.0, 166.0, 193.0, 148.0, 84.0, 48.0, 38.0, 23.0, 18.0, 10.0, 8.0, 6.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4345703125, -0.42194366455078125, -0.4093170166015625, -0.39669036865234375, -0.384063720703125, -0.37143707275390625, -0.3588104248046875, -0.34618377685546875, -0.33355712890625, -0.32093048095703125, -0.3083038330078125, -0.29567718505859375, -0.283050537109375, -0.27042388916015625, -0.2577972412109375, -0.24517059326171875, -0.2325439453125, -0.21991729736328125, -0.2072906494140625, -0.19466400146484375, -0.182037353515625, -0.16941070556640625, -0.1567840576171875, -0.14415740966796875, -0.13153076171875, -0.11890411376953125, -0.1062774658203125, -0.09365081787109375, -0.081024169921875, -0.06839752197265625, -0.0557708740234375, -0.04314422607421875, -0.030517578125, -0.01789093017578125, -0.0052642822265625, 0.00736236572265625, 0.019989013671875, 0.03261566162109375, 0.0452423095703125, 0.05786895751953125, 0.07049560546875, 0.08312225341796875, 0.0957489013671875, 0.10837554931640625, 0.121002197265625, 0.13362884521484375, 0.1462554931640625, 0.15888214111328125, 0.1715087890625, 0.18413543701171875, 0.1967620849609375, 0.20938873291015625, 0.222015380859375, 0.23464202880859375, 0.2472686767578125, 0.25989532470703125, 0.27252197265625, 0.28514862060546875, 0.2977752685546875, 0.31040191650390625, 0.323028564453125, 0.33565521240234375, 0.3482818603515625, 0.36090850830078125, 0.37353515625]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 13.0, 40.0, 597.0, 310.0, 42.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.428099155426025, -6.589502334594727, -5.7509050369262695, -4.912308216094971, -4.073711395263672, -3.235114097595215, -2.396517276763916, -1.557919979095459, -0.7193231582641602, 0.119273841381073, 0.9578708410263062, 1.7964677810668945, 2.6350648403167725, 3.4736618995666504, 4.312258720397949, 5.150856018066406, 5.989452838897705, 6.828049659729004, 7.666646957397461, 8.505243301391602, 9.343840599060059, 10.182437896728516, 11.021034240722656, 11.85963249206543, 12.69822883605957, 13.536826133728027, 14.375422477722168, 15.214019775390625, 16.052616119384766, 16.89121437072754, 17.72981071472168, 18.568408966064453, 19.40700340270996, 20.2455997467041, 21.084197998046875, 21.922794342041016, 22.761390686035156, 23.59998893737793, 24.43858528137207, 25.277183532714844, 26.115779876708984, 26.954376220703125, 27.7929744720459, 28.63157081604004, 29.47016716003418, 30.308765411376953, 31.147361755371094, 31.985958099365234, 32.824554443359375, 33.663150787353516, 34.501747131347656, 35.34034729003906, 36.1789436340332, 37.017539978027344, 37.856136322021484, 38.694732666015625, 39.53333282470703, 40.37192916870117, 41.21052551269531, 42.04912567138672, 42.88772201538086, 43.726318359375, 44.56491470336914, 45.40351104736328, 46.24210739135742]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 2.0, 5.0, 11.0, 15.0, 6.0, 7.0, 11.0, 18.0, 21.0, 25.0, 49.0, 38.0, 40.0, 34.0, 45.0, 44.0, 62.0, 53.0, 48.0, 44.0, 49.0, 48.0, 45.0, 38.0, 47.0, 37.0, 23.0, 25.0, 23.0, 21.0, 16.0, 6.0, 16.0, 5.0, 4.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.437473297119141, -6.233244895935059, -6.029016017913818, -5.824787616729736, -5.620559215545654, -5.416330337524414, -5.212101936340332, -5.00787353515625, -4.803645133972168, -4.599416732788086, -4.395187854766846, -4.190959453582764, -3.9867310523986816, -3.7825024127960205, -3.5782737731933594, -3.3740453720092773, -3.169816493988037, -2.965587854385376, -2.761359453201294, -2.557130813598633, -2.352902412414551, -2.1486737728118896, -1.9444451332092285, -1.740216612815857, -1.5359880924224854, -1.3317595720291138, -1.1275310516357422, -0.923302412033081, -0.7190738916397095, -0.5148453712463379, -0.31061673164367676, -0.10638821125030518, 0.09784078598022461, 0.3020693361759186, 0.5062978863716125, 0.7105264663696289, 0.9147549867630005, 1.118983507156372, 1.3232121467590332, 1.5274406671524048, 1.7316691875457764, 1.935897707939148, 2.1401262283325195, 2.3443548679351807, 2.548583507537842, 2.752811908721924, 2.957040548324585, 3.161269187927246, 3.365497589111328, 3.5697262287139893, 3.7739546298980713, 3.9781832695007324, 4.1824116706848145, 4.386640548706055, 4.590868949890137, 4.795097351074219, 4.999325752258301, 5.203554153442383, 5.407783031463623, 5.612011432647705, 5.816239833831787, 6.020468711853027, 6.224697113037109, 6.428925514221191, 6.633154392242432]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 8.0, 3.0, 14.0, 26.0, 28.0, 80.0, 123.0, 196.0, 358.0, 662.0, 1337.0, 2970.0, 7755.0, 27969.0, 177790.0, 3573611.0, 344438.0, 39749.0, 10243.0, 3620.0, 1550.0, 765.0, 441.0, 208.0, 135.0, 80.0, 47.0, 25.0, 20.0, 15.0, 6.0, 7.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.46875, -2.38812255859375, -2.3074951171875, -2.22686767578125, -2.146240234375, -2.06561279296875, -1.9849853515625, -1.90435791015625, -1.82373046875, -1.74310302734375, -1.6624755859375, -1.58184814453125, -1.501220703125, -1.42059326171875, -1.3399658203125, -1.25933837890625, -1.1787109375, -1.09808349609375, -1.0174560546875, -0.93682861328125, -0.856201171875, -0.77557373046875, -0.6949462890625, -0.61431884765625, -0.53369140625, -0.45306396484375, -0.3724365234375, -0.29180908203125, -0.211181640625, -0.13055419921875, -0.0499267578125, 0.03070068359375, 0.111328125, 0.19195556640625, 0.2725830078125, 0.35321044921875, 0.433837890625, 0.51446533203125, 0.5950927734375, 0.67572021484375, 0.75634765625, 0.83697509765625, 0.9176025390625, 0.99822998046875, 1.078857421875, 1.15948486328125, 1.2401123046875, 1.32073974609375, 1.4013671875, 1.48199462890625, 1.5626220703125, 1.64324951171875, 1.723876953125, 1.80450439453125, 1.8851318359375, 1.96575927734375, 2.04638671875, 2.12701416015625, 2.2076416015625, 2.28826904296875, 2.368896484375, 2.44952392578125, 2.5301513671875, 2.61077880859375, 2.69140625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 8.0, 2.0, 2.0, 1.0, 5.0, 4.0, 11.0, 5.0, 19.0, 14.0, 18.0, 30.0, 30.0, 42.0, 47.0, 78.0, 83.0, 90.0, 90.0, 90.0, 57.0, 68.0, 33.0, 42.0, 36.0, 27.0, 21.0, 11.0, 10.0, 7.0, 5.0, 3.0, 7.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.423828125, -1.37152099609375, -1.3192138671875, -1.26690673828125, -1.214599609375, -1.16229248046875, -1.1099853515625, -1.05767822265625, -1.00537109375, -0.95306396484375, -0.9007568359375, -0.84844970703125, -0.796142578125, -0.74383544921875, -0.6915283203125, -0.63922119140625, -0.5869140625, -0.53460693359375, -0.4822998046875, -0.42999267578125, -0.377685546875, -0.32537841796875, -0.2730712890625, -0.22076416015625, -0.16845703125, -0.11614990234375, -0.0638427734375, -0.01153564453125, 0.040771484375, 0.09307861328125, 0.1453857421875, 0.19769287109375, 0.25, 0.30230712890625, 0.3546142578125, 0.40692138671875, 0.459228515625, 0.51153564453125, 0.5638427734375, 0.61614990234375, 0.66845703125, 0.72076416015625, 0.7730712890625, 0.82537841796875, 0.877685546875, 0.92999267578125, 0.9822998046875, 1.03460693359375, 1.0869140625, 1.13922119140625, 1.1915283203125, 1.24383544921875, 1.296142578125, 1.34844970703125, 1.4007568359375, 1.45306396484375, 1.50537109375, 1.55767822265625, 1.6099853515625, 1.66229248046875, 1.714599609375, 1.76690673828125, 1.8192138671875, 1.87152099609375, 1.923828125]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 11.0, 7.0, 11.0, 17.0, 19.0, 29.0, 43.0, 81.0, 123.0, 212.0, 349.0, 795.0, 1920.0, 6416.0, 34331.0, 879099.0, 3207453.0, 50880.0, 8240.0, 2356.0, 906.0, 409.0, 221.0, 118.0, 70.0, 50.0, 38.0, 21.0, 12.0, 11.0, 10.0, 7.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.878021240234375, -2.77557373046875, -2.673126220703125, -2.5706787109375, -2.468231201171875, -2.36578369140625, -2.263336181640625, -2.160888671875, -2.058441162109375, -1.95599365234375, -1.853546142578125, -1.7510986328125, -1.648651123046875, -1.54620361328125, -1.443756103515625, -1.34130859375, -1.238861083984375, -1.13641357421875, -1.033966064453125, -0.9315185546875, -0.829071044921875, -0.72662353515625, -0.624176025390625, -0.521728515625, -0.419281005859375, -0.31683349609375, -0.214385986328125, -0.1119384765625, -0.009490966796875, 0.09295654296875, 0.195404052734375, 0.2978515625, 0.400299072265625, 0.50274658203125, 0.605194091796875, 0.7076416015625, 0.810089111328125, 0.91253662109375, 1.014984130859375, 1.117431640625, 1.219879150390625, 1.32232666015625, 1.424774169921875, 1.5272216796875, 1.629669189453125, 1.73211669921875, 1.834564208984375, 1.93701171875, 2.039459228515625, 2.14190673828125, 2.244354248046875, 2.3468017578125, 2.449249267578125, 2.55169677734375, 2.654144287109375, 2.756591796875, 2.859039306640625, 2.96148681640625, 3.063934326171875, 3.1663818359375, 3.268829345703125, 3.37127685546875, 3.473724365234375, 3.576171875]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 2.0, 9.0, 13.0, 24.0, 40.0, 40.0, 67.0, 112.0, 172.0, 366.0, 1283.0, 1072.0, 377.0, 169.0, 111.0, 82.0, 35.0, 23.0, 22.0, 12.0, 15.0, 9.0, 6.0, 2.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81298828125, -0.7883071899414062, -0.7636260986328125, -0.7389450073242188, -0.714263916015625, -0.6895828247070312, -0.6649017333984375, -0.6402206420898438, -0.61553955078125, -0.5908584594726562, -0.5661773681640625, -0.5414962768554688, -0.516815185546875, -0.49213409423828125, -0.4674530029296875, -0.44277191162109375, -0.4180908203125, -0.39340972900390625, -0.3687286376953125, -0.34404754638671875, -0.319366455078125, -0.29468536376953125, -0.2700042724609375, -0.24532318115234375, -0.22064208984375, -0.19596099853515625, -0.1712799072265625, -0.14659881591796875, -0.121917724609375, -0.09723663330078125, -0.0725555419921875, -0.04787445068359375, -0.023193359375, 0.00148773193359375, 0.0261688232421875, 0.05084991455078125, 0.075531005859375, 0.10021209716796875, 0.1248931884765625, 0.14957427978515625, 0.17425537109375, 0.19893646240234375, 0.2236175537109375, 0.24829864501953125, 0.272979736328125, 0.29766082763671875, 0.3223419189453125, 0.34702301025390625, 0.3717041015625, 0.39638519287109375, 0.4210662841796875, 0.44574737548828125, 0.470428466796875, 0.49510955810546875, 0.5197906494140625, 0.5444717407226562, 0.56915283203125, 0.5938339233398438, 0.6185150146484375, 0.6431961059570312, 0.667877197265625, 0.6925582885742188, 0.7172393798828125, 0.7419204711914062, 0.7666015625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 2.0, 4.0, 9.0, 11.0, 17.0, 27.0, 43.0, 86.0, 131.0, 182.0, 201.0, 135.0, 52.0, 35.0, 21.0, 10.0, 11.0, 8.0, 8.0, 4.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.7479658126831055, -4.625550270080566, -4.503134250640869, -4.38071870803833, -4.258302688598633, -4.135887145996094, -4.0134711265563965, -3.8910553455352783, -3.76863956451416, -3.646223783493042, -3.523808002471924, -3.4013922214508057, -3.2789764404296875, -3.1565606594085693, -3.034144878387451, -2.911729097366333, -2.789313316345215, -2.6668975353240967, -2.5444817543029785, -2.4220659732818604, -2.299650192260742, -2.177234411239624, -2.054818630218506, -1.9324028491973877, -1.8099873065948486, -1.6875715255737305, -1.5651557445526123, -1.4427399635314941, -1.320324182510376, -1.1979084014892578, -1.0754926204681396, -0.9530768990516663, -0.8306610584259033, -0.7082452774047852, -0.585829496383667, -0.4634137451648712, -0.34099796414375305, -0.21858221292495728, -0.09616643190383911, 0.026249349117279053, 0.14866513013839722, 0.2710809111595154, 0.39349669218063354, 0.5159124135971069, 0.6383281946182251, 0.7607439756393433, 0.8831597566604614, 1.0055755376815796, 1.1279913187026978, 1.250407099723816, 1.372822880744934, 1.4952386617660522, 1.6176544427871704, 1.740070104598999, 1.8624858856201172, 1.9849016666412354, 2.1073174476623535, 2.2297332286834717, 2.35214900970459, 2.474564790725708, 2.596980571746826, 2.7193963527679443, 2.8418121337890625, 2.9642279148101807, 3.086643695831299]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 3.0, 8.0, 6.0, 7.0, 15.0, 16.0, 23.0, 31.0, 31.0, 54.0, 60.0, 68.0, 69.0, 81.0, 56.0, 78.0, 76.0, 54.0, 48.0, 38.0, 44.0, 35.0, 34.0, 19.0, 17.0, 9.0, 7.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7363262176513672, -1.6730821132659912, -1.6098381280899048, -1.5465940237045288, -1.4833500385284424, -1.4201059341430664, -1.3568618297576904, -1.2936177253723145, -1.230373740196228, -1.167129635810852, -1.1038856506347656, -1.0406415462493896, -0.9773975014686584, -0.9141534566879272, -0.8509093523025513, -0.7876653075218201, -0.7244212627410889, -0.6611772179603577, -0.5979331731796265, -0.5346890687942505, -0.4714450240135193, -0.4082009792327881, -0.3449569046497345, -0.2817128300666809, -0.2184687852859497, -0.1552247256040573, -0.09198066592216492, -0.028736606240272522, 0.03450745344161987, 0.09775149822235107, 0.16099557280540466, 0.22423964738845825, 0.28748393058776855, 0.35072797536849976, 0.41397204995155334, 0.47721612453460693, 0.5404601693153381, 0.6037042140960693, 0.6669483184814453, 0.7301923632621765, 0.7934364080429077, 0.8566804528236389, 0.9199244976043701, 0.9831686019897461, 1.046412706375122, 1.1096566915512085, 1.1729007959365845, 1.236144781112671, 1.2993888854980469, 1.3626329898834229, 1.4258769750595093, 1.4891210794448853, 1.5523650646209717, 1.6156091690063477, 1.6788532733917236, 1.7420973777770996, 1.805341362953186, 1.868585467338562, 1.9318294525146484, 1.9950735569000244, 2.0583176612854004, 2.1215615272521973, 2.1848056316375732, 2.248049736022949, 2.311293840408325]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 2.0, 6.0, 4.0, 6.0, 12.0, 21.0, 30.0, 59.0, 84.0, 202.0, 597.0, 2628.0, 29748.0, 900015.0, 108418.0, 5221.0, 942.0, 272.0, 123.0, 72.0, 35.0, 24.0, 10.0, 11.0, 6.0, 6.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3544921875, -0.34168243408203125, -0.3288726806640625, -0.31606292724609375, -0.303253173828125, -0.29044342041015625, -0.2776336669921875, -0.26482391357421875, -0.25201416015625, -0.23920440673828125, -0.2263946533203125, -0.21358489990234375, -0.200775146484375, -0.18796539306640625, -0.1751556396484375, -0.16234588623046875, -0.1495361328125, -0.13672637939453125, -0.1239166259765625, -0.11110687255859375, -0.098297119140625, -0.08548736572265625, -0.0726776123046875, -0.05986785888671875, -0.04705810546875, -0.03424835205078125, -0.0214385986328125, -0.00862884521484375, 0.004180908203125, 0.01699066162109375, 0.0298004150390625, 0.04261016845703125, 0.055419921875, 0.06822967529296875, 0.0810394287109375, 0.09384918212890625, 0.106658935546875, 0.11946868896484375, 0.1322784423828125, 0.14508819580078125, 0.15789794921875, 0.17070770263671875, 0.1835174560546875, 0.19632720947265625, 0.209136962890625, 0.22194671630859375, 0.2347564697265625, 0.24756622314453125, 0.2603759765625, 0.27318572998046875, 0.2859954833984375, 0.29880523681640625, 0.311614990234375, 0.32442474365234375, 0.3372344970703125, 0.35004425048828125, 0.36285400390625, 0.37566375732421875, 0.3884735107421875, 0.40128326416015625, 0.414093017578125, 0.42690277099609375, 0.4397125244140625, 0.45252227783203125, 0.46533203125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 4.0, 4.0, 5.0, 5.0, 13.0, 15.0, 17.0, 41.0, 34.0, 59.0, 82.0, 100.0, 86.0, 95.0, 106.0, 69.0, 66.0, 52.0, 48.0, 39.0, 22.0, 10.0, 12.0, 6.0, 7.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5078125, -1.448486328125, -1.38916015625, -1.329833984375, -1.2705078125, -1.211181640625, -1.15185546875, -1.092529296875, -1.033203125, -0.973876953125, -0.91455078125, -0.855224609375, -0.7958984375, -0.736572265625, -0.67724609375, -0.617919921875, -0.55859375, -0.499267578125, -0.43994140625, -0.380615234375, -0.3212890625, -0.261962890625, -0.20263671875, -0.143310546875, -0.083984375, -0.024658203125, 0.03466796875, 0.093994140625, 0.1533203125, 0.212646484375, 0.27197265625, 0.331298828125, 0.390625, 0.449951171875, 0.50927734375, 0.568603515625, 0.6279296875, 0.687255859375, 0.74658203125, 0.805908203125, 0.865234375, 0.924560546875, 0.98388671875, 1.043212890625, 1.1025390625, 1.161865234375, 1.22119140625, 1.280517578125, 1.33984375, 1.399169921875, 1.45849609375, 1.517822265625, 1.5771484375, 1.636474609375, 1.69580078125, 1.755126953125, 1.814453125, 1.873779296875, 1.93310546875, 1.992431640625, 2.0517578125, 2.111083984375, 2.17041015625, 2.229736328125, 2.2890625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 7.0, 9.0, 8.0, 6.0, 7.0, 14.0, 19.0, 23.0, 26.0, 30.0, 53.0, 77.0, 119.0, 194.0, 280.0, 641.0, 2088.0, 11946.0, 118976.0, 781921.0, 117575.0, 11177.0, 1888.0, 601.0, 291.0, 169.0, 119.0, 83.0, 43.0, 38.0, 26.0, 23.0, 17.0, 13.0, 7.0, 12.0, 6.0, 5.0, 10.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1600341796875, -0.15460777282714844, -0.14918136596679688, -0.1437549591064453, -0.13832855224609375, -0.1329021453857422, -0.12747573852539062, -0.12204933166503906, -0.1166229248046875, -0.11119651794433594, -0.10577011108398438, -0.10034370422363281, -0.09491729736328125, -0.08949089050292969, -0.08406448364257812, -0.07863807678222656, -0.073211669921875, -0.06778526306152344, -0.062358856201171875, -0.05693244934082031, -0.05150604248046875, -0.04607963562011719, -0.040653228759765625, -0.03522682189941406, -0.0298004150390625, -0.024374008178710938, -0.018947601318359375, -0.013521194458007812, -0.00809478759765625, -0.0026683807373046875, 0.002758026123046875, 0.008184432983398438, 0.01361083984375, 0.019037246704101562, 0.024463653564453125, 0.029890060424804688, 0.03531646728515625, 0.04074287414550781, 0.046169281005859375, 0.05159568786621094, 0.0570220947265625, 0.06244850158691406, 0.06787490844726562, 0.07330131530761719, 0.07872772216796875, 0.08415412902832031, 0.08958053588867188, 0.09500694274902344, 0.100433349609375, 0.10585975646972656, 0.11128616333007812, 0.11671257019042969, 0.12213897705078125, 0.1275653839111328, 0.13299179077148438, 0.13841819763183594, 0.1438446044921875, 0.14927101135253906, 0.15469741821289062, 0.1601238250732422, 0.16555023193359375, 0.1709766387939453, 0.17640304565429688, 0.18182945251464844, 0.187255859375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 10.0, 2.0, 6.0, 9.0, 9.0, 4.0, 11.0, 15.0, 15.0, 23.0, 26.0, 28.0, 18.0, 29.0, 36.0, 34.0, 52.0, 44.0, 54.0, 47.0, 51.0, 49.0, 40.0, 59.0, 42.0, 41.0, 35.0, 37.0, 35.0, 25.0, 16.0, 22.0, 19.0, 8.0, 11.0, 8.0, 8.0, 3.0, 6.0, 11.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8525390625, -1.79315185546875, -1.7337646484375, -1.67437744140625, -1.614990234375, -1.55560302734375, -1.4962158203125, -1.43682861328125, -1.37744140625, -1.31805419921875, -1.2586669921875, -1.19927978515625, -1.139892578125, -1.08050537109375, -1.0211181640625, -0.96173095703125, -0.90234375, -0.84295654296875, -0.7835693359375, -0.72418212890625, -0.664794921875, -0.60540771484375, -0.5460205078125, -0.48663330078125, -0.42724609375, -0.36785888671875, -0.3084716796875, -0.24908447265625, -0.189697265625, -0.13031005859375, -0.0709228515625, -0.01153564453125, 0.0478515625, 0.10723876953125, 0.1666259765625, 0.22601318359375, 0.285400390625, 0.34478759765625, 0.4041748046875, 0.46356201171875, 0.52294921875, 0.58233642578125, 0.6417236328125, 0.70111083984375, 0.760498046875, 0.81988525390625, 0.8792724609375, 0.93865966796875, 0.998046875, 1.05743408203125, 1.1168212890625, 1.17620849609375, 1.235595703125, 1.29498291015625, 1.3543701171875, 1.41375732421875, 1.47314453125, 1.53253173828125, 1.5919189453125, 1.65130615234375, 1.710693359375, 1.77008056640625, 1.8294677734375, 1.88885498046875, 1.9482421875]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 5.0, 7.0, 7.0, 13.0, 19.0, 20.0, 33.0, 43.0, 52.0, 79.0, 154.0, 304.0, 750.0, 2927.0, 77190.0, 958491.0, 6466.0, 1093.0, 357.0, 184.0, 102.0, 66.0, 42.0, 41.0, 25.0, 21.0, 14.0, 10.0, 7.0, 8.0, 6.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042755126953125, -0.041182518005371094, -0.03960990905761719, -0.03803730010986328, -0.036464691162109375, -0.03489208221435547, -0.03331947326660156, -0.031746864318847656, -0.03017425537109375, -0.028601646423339844, -0.027029037475585938, -0.02545642852783203, -0.023883819580078125, -0.02231121063232422, -0.020738601684570312, -0.019165992736816406, -0.0175933837890625, -0.016020774841308594, -0.014448165893554688, -0.012875556945800781, -0.011302947998046875, -0.009730339050292969, -0.008157730102539062, -0.006585121154785156, -0.00501251220703125, -0.0034399032592773438, -0.0018672943115234375, -0.00029468536376953125, 0.001277923583984375, 0.0028505325317382812, 0.0044231414794921875, 0.005995750427246094, 0.007568359375, 0.009140968322753906, 0.010713577270507812, 0.012286186218261719, 0.013858795166015625, 0.015431404113769531, 0.017004013061523438, 0.018576622009277344, 0.02014923095703125, 0.021721839904785156, 0.023294448852539062, 0.02486705780029297, 0.026439666748046875, 0.02801227569580078, 0.029584884643554688, 0.031157493591308594, 0.0327301025390625, 0.034302711486816406, 0.03587532043457031, 0.03744792938232422, 0.039020538330078125, 0.04059314727783203, 0.04216575622558594, 0.043738365173339844, 0.04531097412109375, 0.046883583068847656, 0.04845619201660156, 0.05002880096435547, 0.051601409912109375, 0.05317401885986328, 0.05474662780761719, 0.056319236755371094, 0.057891845703125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 4.0, 2.0, 2.0, 4.0, 9.0, 4.0, 13.0, 25.0, 21.0, 33.0, 67.0, 117.0, 160.0, 138.0, 125.0, 89.0, 64.0, 46.0, 29.0, 10.0, 10.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3530254364013672e-05, -1.2949109077453613e-05, -1.2367963790893555e-05, -1.1786818504333496e-05, -1.1205673217773438e-05, -1.0624527931213379e-05, -1.004338264465332e-05, -9.462237358093262e-06, -8.881092071533203e-06, -8.299946784973145e-06, -7.718801498413086e-06, -7.137656211853027e-06, -6.556510925292969e-06, -5.97536563873291e-06, -5.3942203521728516e-06, -4.813075065612793e-06, -4.231929779052734e-06, -3.6507844924926758e-06, -3.069639205932617e-06, -2.4884939193725586e-06, -1.9073486328125e-06, -1.3262033462524414e-06, -7.450580596923828e-07, -1.6391277313232422e-07, 4.172325134277344e-07, 9.98377799987793e-07, 1.5795230865478516e-06, 2.16066837310791e-06, 2.7418136596679688e-06, 3.3229589462280273e-06, 3.904104232788086e-06, 4.4852495193481445e-06, 5.066394805908203e-06, 5.647540092468262e-06, 6.22868537902832e-06, 6.809830665588379e-06, 7.3909759521484375e-06, 7.972121238708496e-06, 8.553266525268555e-06, 9.134411811828613e-06, 9.715557098388672e-06, 1.029670238494873e-05, 1.0877847671508789e-05, 1.1458992958068848e-05, 1.2040138244628906e-05, 1.2621283531188965e-05, 1.3202428817749023e-05, 1.3783574104309082e-05, 1.436471939086914e-05, 1.49458646774292e-05, 1.5527009963989258e-05, 1.6108155250549316e-05, 1.6689300537109375e-05, 1.7270445823669434e-05, 1.7851591110229492e-05, 1.843273639678955e-05, 1.901388168334961e-05, 1.9595026969909668e-05, 2.0176172256469727e-05, 2.0757317543029785e-05, 2.1338462829589844e-05, 2.1919608116149902e-05, 2.250075340270996e-05, 2.308189868927002e-05, 2.3663043975830078e-05]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 4.0, 6.0, 6.0, 9.0, 12.0, 30.0, 25.0, 42.0, 73.0, 96.0, 188.0, 381.0, 736.0, 2432.0, 13394.0, 902416.0, 118971.0, 6831.0, 1614.0, 560.0, 297.0, 148.0, 85.0, 64.0, 50.0, 31.0, 17.0, 13.0, 7.0, 7.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06719970703125, -0.06486892700195312, -0.06253814697265625, -0.060207366943359375, -0.0578765869140625, -0.055545806884765625, -0.05321502685546875, -0.050884246826171875, -0.048553466796875, -0.046222686767578125, -0.04389190673828125, -0.041561126708984375, -0.0392303466796875, -0.036899566650390625, -0.03456878662109375, -0.032238006591796875, -0.0299072265625, -0.027576446533203125, -0.02524566650390625, -0.022914886474609375, -0.0205841064453125, -0.018253326416015625, -0.01592254638671875, -0.013591766357421875, -0.011260986328125, -0.008930206298828125, -0.00659942626953125, -0.004268646240234375, -0.0019378662109375, 0.000392913818359375, 0.00272369384765625, 0.005054473876953125, 0.00738525390625, 0.009716033935546875, 0.01204681396484375, 0.014377593994140625, 0.0167083740234375, 0.019039154052734375, 0.02136993408203125, 0.023700714111328125, 0.026031494140625, 0.028362274169921875, 0.03069305419921875, 0.033023834228515625, 0.0353546142578125, 0.037685394287109375, 0.04001617431640625, 0.042346954345703125, 0.044677734375, 0.047008514404296875, 0.04933929443359375, 0.051670074462890625, 0.0540008544921875, 0.056331634521484375, 0.05866241455078125, 0.060993194580078125, 0.063323974609375, 0.06565475463867188, 0.06798553466796875, 0.07031631469726562, 0.0726470947265625, 0.07497787475585938, 0.07730865478515625, 0.07963943481445312, 0.08197021484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 9.0, 10.0, 11.0, 14.0, 25.0, 32.0, 38.0, 78.0, 161.0, 183.0, 167.0, 95.0, 53.0, 33.0, 27.0, 23.0, 12.0, 11.0, 6.0, 6.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00777435302734375, -0.007582962512969971, -0.007391571998596191, -0.007200181484222412, -0.007008790969848633, -0.0068174004554748535, -0.006626009941101074, -0.006434619426727295, -0.006243228912353516, -0.006051838397979736, -0.005860447883605957, -0.005669057369232178, -0.0054776668548583984, -0.005286276340484619, -0.00509488582611084, -0.0049034953117370605, -0.004712104797363281, -0.004520714282989502, -0.004329323768615723, -0.004137933254241943, -0.003946542739868164, -0.0037551522254943848, -0.0035637617111206055, -0.003372371196746826, -0.003180980682373047, -0.0029895901679992676, -0.0027981996536254883, -0.002606809139251709, -0.0024154186248779297, -0.0022240281105041504, -0.002032637596130371, -0.0018412470817565918, -0.0016498565673828125, -0.0014584660530090332, -0.001267075538635254, -0.0010756850242614746, -0.0008842945098876953, -0.000692903995513916, -0.0005015134811401367, -0.0003101229667663574, -0.00011873245239257812, 7.265806198120117e-05, 0.00026404857635498047, 0.00045543909072875977, 0.0006468296051025391, 0.0008382201194763184, 0.0010296106338500977, 0.001221001148223877, 0.0014123916625976562, 0.0016037821769714355, 0.0017951726913452148, 0.001986563205718994, 0.0021779537200927734, 0.0023693442344665527, 0.002560734748840332, 0.0027521252632141113, 0.0029435157775878906, 0.00313490629196167, 0.0033262968063354492, 0.0035176873207092285, 0.003709077835083008, 0.003900468349456787, 0.004091858863830566, 0.004283249378204346, 0.004474639892578125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 12.0, 17.0, 30.0, 40.0, 101.0, 195.0, 228.0, 194.0, 74.0, 43.0, 16.0, 14.0, 11.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8177742958068848, -3.7183310985565186, -3.6188876628875732, -3.519444465637207, -3.420001268386841, -3.3205578327178955, -3.2211146354675293, -3.121671199798584, -3.0222280025482178, -2.9227848052978516, -2.8233413696289062, -2.72389817237854, -2.624454975128174, -2.5250115394592285, -2.4255683422088623, -2.326125144958496, -2.226681709289551, -2.1272385120391846, -2.0277950763702393, -1.928351879119873, -1.8289085626602173, -1.7294652462005615, -1.6300220489501953, -1.5305787324905396, -1.431135654449463, -1.3316923379898071, -1.232249140739441, -1.1328058242797852, -1.0333625078201294, -0.9339192509651184, -0.8344759941101074, -0.7350326776504517, -0.6355893611907959, -0.5361461043357849, -0.43670278787612915, -0.33725953102111816, -0.2378162443637848, -0.13837295770645142, -0.03892970085144043, 0.06051361560821533, 0.15995687246322632, 0.2594001591205597, 0.35884344577789307, 0.45828670263290405, 0.557729959487915, 0.6571732759475708, 0.7566165328025818, 0.8560598492622375, 0.9555031061172485, 1.0549464225769043, 1.1543896198272705, 1.2538329362869263, 1.353276252746582, 1.4527194499969482, 1.552162766456604, 1.6516060829162598, 1.751049280166626, 1.8504925966262817, 1.949935793876648, 2.0493791103363037, 2.14882230758667, 2.2482657432556152, 2.3477089405059814, 2.4471521377563477, 2.546595573425293]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 3.0, 6.0, 5.0, 5.0, 15.0, 19.0, 26.0, 34.0, 40.0, 71.0, 72.0, 93.0, 100.0, 81.0, 99.0, 74.0, 52.0, 54.0, 46.0, 37.0, 20.0, 18.0, 8.0, 4.0, 5.0, 6.0, 2.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.456957459449768, -1.4033881425857544, -1.3498188257217407, -1.2962493896484375, -1.2426800727844238, -1.1891107559204102, -1.1355414390563965, -1.0819721221923828, -1.0284026861190796, -0.9748333692550659, -0.9212639927864075, -0.8676946759223938, -0.8141252994537354, -0.7605559825897217, -0.706986665725708, -0.6534172892570496, -0.5998479723930359, -0.5462786555290222, -0.49270927906036377, -0.4391399621963501, -0.38557058572769165, -0.332001268863678, -0.2784319221973419, -0.22486257553100586, -0.1712932288646698, -0.11772388219833374, -0.06415454298257828, -0.010585203766822815, 0.042984142899513245, 0.09655347466468811, 0.15012282133102417, 0.20369216799736023, 0.2572615146636963, 0.31083086133003235, 0.3644002079963684, 0.4179695248603821, 0.4715389013290405, 0.5251082181930542, 0.5786775350570679, 0.6322469115257263, 0.6858162879943848, 0.7393856048583984, 0.7929549813270569, 0.8465242981910706, 0.900093674659729, 0.9536629915237427, 1.0072323083877563, 1.0608017444610596, 1.1143710613250732, 1.167940378189087, 1.2215096950531006, 1.2750791311264038, 1.3286484479904175, 1.3822177648544312, 1.4357870817184448, 1.489356517791748, 1.5429257154464722, 1.5964950323104858, 1.6500643491744995, 1.7036337852478027, 1.7572031021118164, 1.81077241897583, 1.8643417358398438, 1.9179110527038574, 1.9714804887771606]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 8.0, 13.0, 17.0, 14.0, 22.0, 26.0, 31.0, 54.0, 84.0, 111.0, 176.0, 222.0, 403.0, 563.0, 841.0, 1422.0, 2252.0, 3897.0, 7671.0, 17071.0, 53099.0, 326071.0, 521631.0, 71639.0, 21178.0, 8709.0, 4460.0, 2472.0, 1487.0, 976.0, 592.0, 429.0, 277.0, 170.0, 124.0, 95.0, 68.0, 47.0, 41.0, 30.0, 17.0, 13.0, 8.0, 8.0, 6.0, 7.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-1.228515625, -1.19140625, -1.154296875, -1.1171875, -1.080078125, -1.04296875, -1.005859375, -0.96875, -0.931640625, -0.89453125, -0.857421875, -0.8203125, -0.783203125, -0.74609375, -0.708984375, -0.671875, -0.634765625, -0.59765625, -0.560546875, -0.5234375, -0.486328125, -0.44921875, -0.412109375, -0.375, -0.337890625, -0.30078125, -0.263671875, -0.2265625, -0.189453125, -0.15234375, -0.115234375, -0.078125, -0.041015625, -0.00390625, 0.033203125, 0.0703125, 0.107421875, 0.14453125, 0.181640625, 0.21875, 0.255859375, 0.29296875, 0.330078125, 0.3671875, 0.404296875, 0.44140625, 0.478515625, 0.515625, 0.552734375, 0.58984375, 0.626953125, 0.6640625, 0.701171875, 0.73828125, 0.775390625, 0.8125, 0.849609375, 0.88671875, 0.923828125, 0.9609375, 0.998046875, 1.03515625, 1.072265625, 1.109375, 1.146484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 12.0, 10.0, 12.0, 25.0, 26.0, 37.0, 57.0, 55.0, 87.0, 78.0, 93.0, 97.0, 82.0, 51.0, 62.0, 47.0, 48.0, 39.0, 17.0, 15.0, 8.0, 4.0, 6.0, 5.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.138671875, -3.033172607421875, -2.92767333984375, -2.822174072265625, -2.7166748046875, -2.611175537109375, -2.50567626953125, -2.400177001953125, -2.294677734375, -2.189178466796875, -2.08367919921875, -1.978179931640625, -1.8726806640625, -1.767181396484375, -1.66168212890625, -1.556182861328125, -1.45068359375, -1.345184326171875, -1.23968505859375, -1.134185791015625, -1.0286865234375, -0.923187255859375, -0.81768798828125, -0.712188720703125, -0.606689453125, -0.501190185546875, -0.39569091796875, -0.290191650390625, -0.1846923828125, -0.079193115234375, 0.02630615234375, 0.131805419921875, 0.2373046875, 0.342803955078125, 0.44830322265625, 0.553802490234375, 0.6593017578125, 0.764801025390625, 0.87030029296875, 0.975799560546875, 1.081298828125, 1.186798095703125, 1.29229736328125, 1.397796630859375, 1.5032958984375, 1.608795166015625, 1.71429443359375, 1.819793701171875, 1.92529296875, 2.030792236328125, 2.13629150390625, 2.241790771484375, 2.3472900390625, 2.452789306640625, 2.55828857421875, 2.663787841796875, 2.769287109375, 2.874786376953125, 2.98028564453125, 3.085784912109375, 3.1912841796875, 3.296783447265625, 3.40228271484375, 3.507781982421875, 3.61328125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 8.0, 5.0, 17.0, 18.0, 16.0, 37.0, 46.0, 79.0, 139.0, 259.0, 549.0, 1151.0, 3040.0, 10414.0, 55376.0, 827832.0, 125984.0, 16092.0, 4599.0, 1491.0, 665.0, 299.0, 160.0, 80.0, 62.0, 47.0, 27.0, 19.0, 11.0, 15.0, 6.0, 6.0, 1.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7138671875, -1.657958984375, -1.60205078125, -1.546142578125, -1.490234375, -1.434326171875, -1.37841796875, -1.322509765625, -1.2666015625, -1.210693359375, -1.15478515625, -1.098876953125, -1.04296875, -0.987060546875, -0.93115234375, -0.875244140625, -0.8193359375, -0.763427734375, -0.70751953125, -0.651611328125, -0.595703125, -0.539794921875, -0.48388671875, -0.427978515625, -0.3720703125, -0.316162109375, -0.26025390625, -0.204345703125, -0.1484375, -0.092529296875, -0.03662109375, 0.019287109375, 0.0751953125, 0.131103515625, 0.18701171875, 0.242919921875, 0.298828125, 0.354736328125, 0.41064453125, 0.466552734375, 0.5224609375, 0.578369140625, 0.63427734375, 0.690185546875, 0.74609375, 0.802001953125, 0.85791015625, 0.913818359375, 0.9697265625, 1.025634765625, 1.08154296875, 1.137451171875, 1.193359375, 1.249267578125, 1.30517578125, 1.361083984375, 1.4169921875, 1.472900390625, 1.52880859375, 1.584716796875, 1.640625, 1.696533203125, 1.75244140625, 1.808349609375, 1.8642578125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 6.0, 9.0, 3.0, 10.0, 7.0, 12.0, 17.0, 18.0, 25.0, 37.0, 30.0, 27.0, 34.0, 22.0, 32.0, 53.0, 56.0, 47.0, 43.0, 50.0, 33.0, 45.0, 45.0, 39.0, 41.0, 34.0, 33.0, 32.0, 34.0, 20.0, 21.0, 11.0, 11.0, 13.0, 9.0, 13.0, 9.0, 7.0, 3.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2734375, -2.18695068359375, -2.1004638671875, -2.01397705078125, -1.927490234375, -1.84100341796875, -1.7545166015625, -1.66802978515625, -1.58154296875, -1.49505615234375, -1.4085693359375, -1.32208251953125, -1.235595703125, -1.14910888671875, -1.0626220703125, -0.97613525390625, -0.8896484375, -0.80316162109375, -0.7166748046875, -0.63018798828125, -0.543701171875, -0.45721435546875, -0.3707275390625, -0.28424072265625, -0.19775390625, -0.11126708984375, -0.0247802734375, 0.06170654296875, 0.148193359375, 0.23468017578125, 0.3211669921875, 0.40765380859375, 0.494140625, 0.58062744140625, 0.6671142578125, 0.75360107421875, 0.840087890625, 0.92657470703125, 1.0130615234375, 1.09954833984375, 1.18603515625, 1.27252197265625, 1.3590087890625, 1.44549560546875, 1.531982421875, 1.61846923828125, 1.7049560546875, 1.79144287109375, 1.8779296875, 1.96441650390625, 2.0509033203125, 2.13739013671875, 2.223876953125, 2.31036376953125, 2.3968505859375, 2.48333740234375, 2.56982421875, 2.65631103515625, 2.7427978515625, 2.82928466796875, 2.915771484375, 3.00225830078125, 3.0887451171875, 3.17523193359375, 3.26171875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 4.0, 3.0, 10.0, 6.0, 11.0, 10.0, 12.0, 17.0, 37.0, 62.0, 86.0, 170.0, 392.0, 924.0, 2452.0, 8842.0, 115516.0, 890727.0, 22301.0, 4370.0, 1431.0, 566.0, 274.0, 137.0, 73.0, 36.0, 30.0, 19.0, 8.0, 8.0, 6.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3193359375, -1.2808074951171875, -1.242279052734375, -1.2037506103515625, -1.16522216796875, -1.1266937255859375, -1.088165283203125, -1.0496368408203125, -1.0111083984375, -0.9725799560546875, -0.934051513671875, -0.8955230712890625, -0.85699462890625, -0.8184661865234375, -0.779937744140625, -0.7414093017578125, -0.702880859375, -0.6643524169921875, -0.625823974609375, -0.5872955322265625, -0.54876708984375, -0.5102386474609375, -0.471710205078125, -0.4331817626953125, -0.3946533203125, -0.3561248779296875, -0.317596435546875, -0.2790679931640625, -0.24053955078125, -0.2020111083984375, -0.163482666015625, -0.1249542236328125, -0.08642578125, -0.0478973388671875, -0.009368896484375, 0.0291595458984375, 0.06768798828125, 0.1062164306640625, 0.144744873046875, 0.1832733154296875, 0.2218017578125, 0.2603302001953125, 0.298858642578125, 0.3373870849609375, 0.37591552734375, 0.4144439697265625, 0.452972412109375, 0.4915008544921875, 0.530029296875, 0.5685577392578125, 0.607086181640625, 0.6456146240234375, 0.68414306640625, 0.7226715087890625, 0.761199951171875, 0.7997283935546875, 0.8382568359375, 0.8767852783203125, 0.915313720703125, 0.9538421630859375, 0.99237060546875, 1.0308990478515625, 1.069427490234375, 1.1079559326171875, 1.146484375]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 9.0, 6.0, 18.0, 34.0, 65.0, 120.0, 319.0, 217.0, 94.0, 44.0, 19.0, 17.0, 16.0, 6.0, 8.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019121170043945312, -0.00018586963415145874, -0.00018052756786346436, -0.00017518550157546997, -0.00016984343528747559, -0.0001645013689994812, -0.00015915930271148682, -0.00015381723642349243, -0.00014847517013549805, -0.00014313310384750366, -0.00013779103755950928, -0.0001324489712715149, -0.0001271069049835205, -0.00012176483869552612, -0.00011642277240753174, -0.00011108070611953735, -0.00010573863983154297, -0.00010039657354354858, -9.50545072555542e-05, -8.971244096755981e-05, -8.437037467956543e-05, -7.902830839157104e-05, -7.368624210357666e-05, -6.834417581558228e-05, -6.300210952758789e-05, -5.7660043239593506e-05, -5.231797695159912e-05, -4.6975910663604736e-05, -4.163384437561035e-05, -3.629177808761597e-05, -3.094971179962158e-05, -2.5607645511627197e-05, -2.0265579223632812e-05, -1.4923512935638428e-05, -9.581446647644043e-06, -4.239380359649658e-06, 1.1026859283447266e-06, 6.444752216339111e-06, 1.1786818504333496e-05, 1.712888479232788e-05, 2.2470951080322266e-05, 2.781301736831665e-05, 3.3155083656311035e-05, 3.849714994430542e-05, 4.3839216232299805e-05, 4.918128252029419e-05, 5.4523348808288574e-05, 5.986541509628296e-05, 6.520748138427734e-05, 7.054954767227173e-05, 7.589161396026611e-05, 8.12336802482605e-05, 8.657574653625488e-05, 9.191781282424927e-05, 9.725987911224365e-05, 0.00010260194540023804, 0.00010794401168823242, 0.0001132860779762268, 0.00011862814426422119, 0.00012397021055221558, 0.00012931227684020996, 0.00013465434312820435, 0.00013999640941619873, 0.00014533847570419312, 0.0001506805419921875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 5.0, 8.0, 7.0, 10.0, 16.0, 14.0, 17.0, 30.0, 31.0, 55.0, 94.0, 128.0, 195.0, 407.0, 834.0, 2122.0, 6401.0, 32086.0, 768428.0, 212721.0, 17541.0, 4284.0, 1566.0, 654.0, 353.0, 185.0, 103.0, 62.0, 55.0, 41.0, 21.0, 13.0, 12.0, 8.0, 9.0, 8.0, 9.0, 2.0, 5.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.880859375, -0.852294921875, -0.82373046875, -0.795166015625, -0.7666015625, -0.738037109375, -0.70947265625, -0.680908203125, -0.65234375, -0.623779296875, -0.59521484375, -0.566650390625, -0.5380859375, -0.509521484375, -0.48095703125, -0.452392578125, -0.423828125, -0.395263671875, -0.36669921875, -0.338134765625, -0.3095703125, -0.281005859375, -0.25244140625, -0.223876953125, -0.1953125, -0.166748046875, -0.13818359375, -0.109619140625, -0.0810546875, -0.052490234375, -0.02392578125, 0.004638671875, 0.033203125, 0.061767578125, 0.09033203125, 0.118896484375, 0.1474609375, 0.176025390625, 0.20458984375, 0.233154296875, 0.26171875, 0.290283203125, 0.31884765625, 0.347412109375, 0.3759765625, 0.404541015625, 0.43310546875, 0.461669921875, 0.490234375, 0.518798828125, 0.54736328125, 0.575927734375, 0.6044921875, 0.633056640625, 0.66162109375, 0.690185546875, 0.71875, 0.747314453125, 0.77587890625, 0.804443359375, 0.8330078125, 0.861572265625, 0.89013671875, 0.918701171875, 0.947265625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 7.0, 4.0, 8.0, 9.0, 7.0, 13.0, 14.0, 24.0, 45.0, 98.0, 154.0, 264.0, 140.0, 75.0, 45.0, 28.0, 10.0, 10.0, 14.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37841796875, -0.36554718017578125, -0.3526763916015625, -0.33980560302734375, -0.326934814453125, -0.31406402587890625, -0.3011932373046875, -0.28832244873046875, -0.27545166015625, -0.26258087158203125, -0.2497100830078125, -0.23683929443359375, -0.223968505859375, -0.21109771728515625, -0.1982269287109375, -0.18535614013671875, -0.1724853515625, -0.15961456298828125, -0.1467437744140625, -0.13387298583984375, -0.121002197265625, -0.10813140869140625, -0.0952606201171875, -0.08238983154296875, -0.06951904296875, -0.05664825439453125, -0.0437774658203125, -0.03090667724609375, -0.018035888671875, -0.00516510009765625, 0.0077056884765625, 0.02057647705078125, 0.033447265625, 0.04631805419921875, 0.0591888427734375, 0.07205963134765625, 0.084930419921875, 0.09780120849609375, 0.1106719970703125, 0.12354278564453125, 0.13641357421875, 0.14928436279296875, 0.1621551513671875, 0.17502593994140625, 0.187896728515625, 0.20076751708984375, 0.2136383056640625, 0.22650909423828125, 0.2393798828125, 0.25225067138671875, 0.2651214599609375, 0.27799224853515625, 0.290863037109375, 0.30373382568359375, 0.3166046142578125, 0.32947540283203125, 0.34234619140625, 0.35521697998046875, 0.3680877685546875, 0.38095855712890625, 0.393829345703125, 0.40670013427734375, 0.4195709228515625, 0.43244171142578125, 0.4453125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 9.0, 33.0, 155.0, 506.0, 231.0, 44.0, 15.0, 7.0, 5.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.974451065063477, -15.452621459960938, -14.930791854858398, -14.40896224975586, -13.88713264465332, -13.365303039550781, -12.843472480773926, -12.321642875671387, -11.799813270568848, -11.277983665466309, -10.75615406036377, -10.23432445526123, -9.712493896484375, -9.190664291381836, -8.668834686279297, -8.147005081176758, -7.625175476074219, -7.10334587097168, -6.581516265869141, -6.059686183929443, -5.537856578826904, -5.016026973724365, -4.494196891784668, -3.972367286682129, -3.45053768157959, -2.928708076477051, -2.4068782329559326, -1.885048508644104, -1.3632187843322754, -0.8413891792297363, -0.31955933570861816, 0.2022705078125, 0.7240982055664062, 1.2459279298782349, 1.7677576541900635, 2.2895874977111816, 2.8114171028137207, 3.3332467079162598, 3.855076551437378, 4.376906394958496, 4.898736000061035, 5.420565605163574, 5.942395210266113, 6.4642252922058105, 6.98605489730835, 7.507884502410889, 8.029714584350586, 8.551544189453125, 9.073373794555664, 9.595203399658203, 10.117033004760742, 10.638862609863281, 11.16069221496582, 11.68252182006836, 12.204352378845215, 12.726181983947754, 13.248011589050293, 13.769841194152832, 14.291670799255371, 14.81350040435791, 15.335330963134766, 15.857160568237305, 16.378990173339844, 16.900819778442383, 17.422649383544922]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 2.0, 10.0, 10.0, 14.0, 18.0, 19.0, 21.0, 35.0, 34.0, 27.0, 36.0, 53.0, 49.0, 48.0, 61.0, 56.0, 64.0, 47.0, 60.0, 60.0, 38.0, 38.0, 36.0, 32.0, 24.0, 23.0, 19.0, 14.0, 14.0, 11.0, 5.0, 5.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.235995769500732, -5.043769836425781, -4.85154390335083, -4.659317970275879, -4.467092514038086, -4.274866580963135, -4.082640647888184, -3.8904147148132324, -3.6981887817382812, -3.50596284866333, -3.313736915588379, -3.121511220932007, -2.9292852878570557, -2.7370593547821045, -2.5448336601257324, -2.3526077270507812, -2.16038179397583, -1.968155860900879, -1.7759300470352173, -1.5837042331695557, -1.3914783000946045, -1.1992523670196533, -1.0070265531539917, -0.8148007392883301, -0.6225748062133789, -0.4303489327430725, -0.2381230592727661, -0.04589718580245972, 0.14632868766784668, 0.3385545611381531, 0.5307804346084595, 0.7230062484741211, 0.9152321815490723, 1.1074581146240234, 1.299683928489685, 1.4919097423553467, 1.6841356754302979, 1.876361608505249, 2.068587303161621, 2.2608132362365723, 2.4530391693115234, 2.6452651023864746, 2.837491035461426, 3.029716730117798, 3.221942663192749, 3.4141685962677, 3.6063942909240723, 3.7986202239990234, 3.9908461570739746, 4.183072090148926, 4.375298023223877, 4.567523956298828, 4.759749412536621, 4.951975345611572, 5.144201278686523, 5.336427211761475, 5.528653144836426, 5.720879077911377, 5.913105010986328, 6.105330944061279, 6.2975568771362305, 6.489782333374023, 6.682008266448975, 6.874234199523926, 7.066460132598877]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 13.0, 14.0, 12.0, 23.0, 29.0, 52.0, 77.0, 141.0, 221.0, 462.0, 916.0, 2317.0, 6905.0, 29545.0, 302855.0, 3683640.0, 139709.0, 18546.0, 5056.0, 1929.0, 853.0, 381.0, 210.0, 145.0, 90.0, 49.0, 28.0, 18.0, 17.0, 10.0, 7.0, 6.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.892578125, -2.800384521484375, -2.70819091796875, -2.615997314453125, -2.5238037109375, -2.431610107421875, -2.33941650390625, -2.247222900390625, -2.155029296875, -2.062835693359375, -1.97064208984375, -1.878448486328125, -1.7862548828125, -1.694061279296875, -1.60186767578125, -1.509674072265625, -1.41748046875, -1.325286865234375, -1.23309326171875, -1.140899658203125, -1.0487060546875, -0.956512451171875, -0.86431884765625, -0.772125244140625, -0.679931640625, -0.587738037109375, -0.49554443359375, -0.403350830078125, -0.3111572265625, -0.218963623046875, -0.12677001953125, -0.034576416015625, 0.0576171875, 0.149810791015625, 0.24200439453125, 0.334197998046875, 0.4263916015625, 0.518585205078125, 0.61077880859375, 0.702972412109375, 0.795166015625, 0.887359619140625, 0.97955322265625, 1.071746826171875, 1.1639404296875, 1.256134033203125, 1.34832763671875, 1.440521240234375, 1.53271484375, 1.624908447265625, 1.71710205078125, 1.809295654296875, 1.9014892578125, 1.993682861328125, 2.08587646484375, 2.178070068359375, 2.270263671875, 2.362457275390625, 2.45465087890625, 2.546844482421875, 2.6390380859375, 2.731231689453125, 2.82342529296875, 2.915618896484375, 3.0078125]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 2.0, 8.0, 6.0, 4.0, 15.0, 6.0, 23.0, 28.0, 29.0, 42.0, 62.0, 73.0, 92.0, 74.0, 90.0, 82.0, 67.0, 78.0, 54.0, 41.0, 30.0, 19.0, 16.0, 12.0, 7.0, 6.0, 3.0, 3.0, 8.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4150390625, -1.3591461181640625, -1.303253173828125, -1.2473602294921875, -1.19146728515625, -1.1355743408203125, -1.079681396484375, -1.0237884521484375, -0.9678955078125, -0.9120025634765625, -0.856109619140625, -0.8002166748046875, -0.74432373046875, -0.6884307861328125, -0.632537841796875, -0.5766448974609375, -0.520751953125, -0.4648590087890625, -0.408966064453125, -0.3530731201171875, -0.29718017578125, -0.2412872314453125, -0.185394287109375, -0.1295013427734375, -0.0736083984375, -0.0177154541015625, 0.038177490234375, 0.0940704345703125, 0.14996337890625, 0.2058563232421875, 0.261749267578125, 0.3176422119140625, 0.37353515625, 0.4294281005859375, 0.485321044921875, 0.5412139892578125, 0.59710693359375, 0.6529998779296875, 0.708892822265625, 0.7647857666015625, 0.8206787109375, 0.8765716552734375, 0.932464599609375, 0.9883575439453125, 1.04425048828125, 1.1001434326171875, 1.156036376953125, 1.2119293212890625, 1.267822265625, 1.3237152099609375, 1.379608154296875, 1.4355010986328125, 1.49139404296875, 1.5472869873046875, 1.603179931640625, 1.6590728759765625, 1.7149658203125, 1.7708587646484375, 1.826751708984375, 1.8826446533203125, 1.93853759765625, 1.9944305419921875, 2.050323486328125, 2.1062164306640625, 2.162109375]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 3.0, 4.0, 5.0, 18.0, 22.0, 37.0, 57.0, 100.0, 204.0, 402.0, 844.0, 2624.0, 11695.0, 129346.0, 3905513.0, 127317.0, 11696.0, 2583.0, 911.0, 387.0, 210.0, 113.0, 60.0, 48.0, 33.0, 20.0, 11.0, 4.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.04296875, -3.922271728515625, -3.80157470703125, -3.680877685546875, -3.5601806640625, -3.439483642578125, -3.31878662109375, -3.198089599609375, -3.077392578125, -2.956695556640625, -2.83599853515625, -2.715301513671875, -2.5946044921875, -2.473907470703125, -2.35321044921875, -2.232513427734375, -2.11181640625, -1.991119384765625, -1.87042236328125, -1.749725341796875, -1.6290283203125, -1.508331298828125, -1.38763427734375, -1.266937255859375, -1.146240234375, -1.025543212890625, -0.90484619140625, -0.784149169921875, -0.6634521484375, -0.542755126953125, -0.42205810546875, -0.301361083984375, -0.1806640625, -0.059967041015625, 0.06072998046875, 0.181427001953125, 0.3021240234375, 0.422821044921875, 0.54351806640625, 0.664215087890625, 0.784912109375, 0.905609130859375, 1.02630615234375, 1.147003173828125, 1.2677001953125, 1.388397216796875, 1.50909423828125, 1.629791259765625, 1.75048828125, 1.871185302734375, 1.99188232421875, 2.112579345703125, 2.2332763671875, 2.353973388671875, 2.47467041015625, 2.595367431640625, 2.716064453125, 2.836761474609375, 2.95745849609375, 3.078155517578125, 3.1988525390625, 3.319549560546875, 3.44024658203125, 3.560943603515625, 3.681640625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 6.0, 18.0, 9.0, 16.0, 29.0, 40.0, 60.0, 78.0, 134.0, 229.0, 509.0, 1385.0, 740.0, 336.0, 139.0, 105.0, 74.0, 54.0, 29.0, 17.0, 8.0, 18.0, 10.0, 8.0, 8.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.521484375, -0.49852752685546875, -0.4755706787109375, -0.45261383056640625, -0.429656982421875, -0.40670013427734375, -0.3837432861328125, -0.36078643798828125, -0.33782958984375, -0.31487274169921875, -0.2919158935546875, -0.26895904541015625, -0.246002197265625, -0.22304534912109375, -0.2000885009765625, -0.17713165283203125, -0.1541748046875, -0.13121795654296875, -0.1082611083984375, -0.08530426025390625, -0.062347412109375, -0.03939056396484375, -0.0164337158203125, 0.00652313232421875, 0.02947998046875, 0.05243682861328125, 0.0753936767578125, 0.09835052490234375, 0.121307373046875, 0.14426422119140625, 0.1672210693359375, 0.19017791748046875, 0.213134765625, 0.23609161376953125, 0.2590484619140625, 0.28200531005859375, 0.304962158203125, 0.32791900634765625, 0.3508758544921875, 0.37383270263671875, 0.39678955078125, 0.41974639892578125, 0.4427032470703125, 0.46566009521484375, 0.488616943359375, 0.5115737915039062, 0.5345306396484375, 0.5574874877929688, 0.5804443359375, 0.6034011840820312, 0.6263580322265625, 0.6493148803710938, 0.672271728515625, 0.6952285766601562, 0.7181854248046875, 0.7411422729492188, 0.76409912109375, 0.7870559692382812, 0.8100128173828125, 0.8329696655273438, 0.855926513671875, 0.8788833618164062, 0.9018402099609375, 0.9247970581054688, 0.94775390625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 4.0, 4.0, 6.0, 8.0, 17.0, 16.0, 21.0, 35.0, 60.0, 75.0, 132.0, 155.0, 118.0, 115.0, 96.0, 46.0, 21.0, 21.0, 12.0, 6.0, 8.0, 9.0, 7.0, 2.0, 3.0, 3.0, 0.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.8963539600372314, -3.803611993789673, -3.7108700275421143, -3.6181280612945557, -3.525386095046997, -3.4326441287994385, -3.339901924133301, -3.247159957885742, -3.1544179916381836, -3.061676025390625, -2.9689340591430664, -2.876192092895508, -2.783450126647949, -2.6907081604003906, -2.597966194152832, -2.5052242279052734, -2.412482261657715, -2.3197402954101562, -2.2269983291625977, -2.134256362915039, -2.0415143966674805, -1.9487724304199219, -1.8560303449630737, -1.7632883787155151, -1.6705464124679565, -1.577804446220398, -1.4850624799728394, -1.3923203945159912, -1.2995784282684326, -1.206836462020874, -1.1140944957733154, -1.0213525295257568, -0.9286103248596191, -0.8358683586120605, -0.743126392364502, -0.6503843665122986, -0.55764240026474, -0.4649004340171814, -0.372158408164978, -0.27941644191741943, -0.18667447566986084, -0.09393249452114105, -0.0011905133724212646, 0.09155148267745972, 0.1842934489250183, 0.2770354151725769, 0.3697774410247803, 0.46251940727233887, 0.5552613735198975, 0.648003339767456, 0.7407453060150146, 0.833487331867218, 0.9262292981147766, 1.0189712047576904, 1.1117132902145386, 1.2044552564620972, 1.2971972227096558, 1.3899391889572144, 1.482681155204773, 1.575423240661621, 1.6681652069091797, 1.7609071731567383, 1.8536491394042969, 1.9463911056518555, 2.039133071899414]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 8.0, 10.0, 10.0, 14.0, 8.0, 23.0, 31.0, 54.0, 52.0, 69.0, 67.0, 86.0, 84.0, 86.0, 70.0, 90.0, 59.0, 50.0, 44.0, 21.0, 23.0, 15.0, 8.0, 6.0, 6.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8984811305999756, -1.8194431066513062, -1.7404050827026367, -1.6613669395446777, -1.5823289155960083, -1.5032908916473389, -1.4242527484893799, -1.3452147245407104, -1.266176700592041, -1.1871386766433716, -1.1081006526947021, -1.0290625095367432, -0.9500244855880737, -0.8709864616394043, -0.7919483780860901, -0.7129102945327759, -0.6338722705841064, -0.554834246635437, -0.4757961630821228, -0.396758109331131, -0.31772005558013916, -0.23868200182914734, -0.15964394807815552, -0.08060586452484131, -0.001567840576171875, 0.07747021317481995, 0.15650826692581177, 0.2355463206768036, 0.3145843744277954, 0.39362242817878723, 0.47266048192977905, 0.5516985654830933, 0.6307363510131836, 0.709774374961853, 0.7888124585151672, 0.8678505420684814, 0.9468885660171509, 1.0259265899658203, 1.1049647331237793, 1.1840027570724487, 1.2630407810211182, 1.3420788049697876, 1.421116828918457, 1.500154972076416, 1.5791929960250854, 1.6582310199737549, 1.7372691631317139, 1.8163071870803833, 1.8953452110290527, 1.9743832349777222, 2.0534212589263916, 2.1324594020843506, 2.2114973068237305, 2.2905354499816895, 2.3695735931396484, 2.4486117362976074, 2.5276496410369873, 2.6066877841949463, 2.685725688934326, 2.764763832092285, 2.843801975250244, 2.922839879989624, 3.001878023147583, 3.080915927886963, 3.159954071044922]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 6.0, 6.0, 8.0, 15.0, 15.0, 35.0, 75.0, 113.0, 240.0, 649.0, 1943.0, 11430.0, 528160.0, 491580.0, 11360.0, 1804.0, 591.0, 225.0, 134.0, 62.0, 36.0, 27.0, 13.0, 15.0, 4.0, 6.0, 1.0, 5.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4267578125, -0.4145622253417969, -0.40236663818359375, -0.3901710510253906, -0.3779754638671875, -0.3657798767089844, -0.35358428955078125, -0.3413887023925781, -0.329193115234375, -0.3169975280761719, -0.30480194091796875, -0.2926063537597656, -0.2804107666015625, -0.2682151794433594, -0.25601959228515625, -0.24382400512695312, -0.23162841796875, -0.21943283081054688, -0.20723724365234375, -0.19504165649414062, -0.1828460693359375, -0.17065048217773438, -0.15845489501953125, -0.14625930786132812, -0.134063720703125, -0.12186813354492188, -0.10967254638671875, -0.09747695922851562, -0.0852813720703125, -0.07308578491210938, -0.06089019775390625, -0.048694610595703125, -0.0364990234375, -0.024303436279296875, -0.01210784912109375, 8.7738037109375e-05, 0.0122833251953125, 0.024478912353515625, 0.03667449951171875, 0.048870086669921875, 0.061065673828125, 0.07326126098632812, 0.08545684814453125, 0.09765243530273438, 0.1098480224609375, 0.12204360961914062, 0.13423919677734375, 0.14643478393554688, 0.15863037109375, 0.17082595825195312, 0.18302154541015625, 0.19521713256835938, 0.2074127197265625, 0.21960830688476562, 0.23180389404296875, 0.24399948120117188, 0.256195068359375, 0.2683906555175781, 0.28058624267578125, 0.2927818298339844, 0.3049774169921875, 0.3171730041503906, 0.32936859130859375, 0.3415641784667969, 0.353759765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 11.0, 16.0, 9.0, 24.0, 26.0, 56.0, 79.0, 88.0, 117.0, 113.0, 110.0, 117.0, 71.0, 57.0, 39.0, 26.0, 14.0, 10.0, 4.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9306640625, -1.8579864501953125, -1.785308837890625, -1.7126312255859375, -1.63995361328125, -1.5672760009765625, -1.494598388671875, -1.4219207763671875, -1.3492431640625, -1.2765655517578125, -1.203887939453125, -1.1312103271484375, -1.05853271484375, -0.9858551025390625, -0.913177490234375, -0.8404998779296875, -0.767822265625, -0.6951446533203125, -0.622467041015625, -0.5497894287109375, -0.47711181640625, -0.4044342041015625, -0.331756591796875, -0.2590789794921875, -0.1864013671875, -0.1137237548828125, -0.041046142578125, 0.0316314697265625, 0.10430908203125, 0.1769866943359375, 0.249664306640625, 0.3223419189453125, 0.39501953125, 0.4676971435546875, 0.540374755859375, 0.6130523681640625, 0.68572998046875, 0.7584075927734375, 0.831085205078125, 0.9037628173828125, 0.9764404296875, 1.0491180419921875, 1.121795654296875, 1.1944732666015625, 1.26715087890625, 1.3398284912109375, 1.412506103515625, 1.4851837158203125, 1.557861328125, 1.6305389404296875, 1.703216552734375, 1.7758941650390625, 1.84857177734375, 1.9212493896484375, 1.993927001953125, 2.0666046142578125, 2.1392822265625, 2.2119598388671875, 2.284637451171875, 2.3573150634765625, 2.42999267578125, 2.5026702880859375, 2.575347900390625, 2.6480255126953125, 2.720703125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 4.0, 6.0, 5.0, 10.0, 15.0, 8.0, 18.0, 31.0, 34.0, 37.0, 52.0, 57.0, 83.0, 96.0, 126.0, 210.0, 360.0, 909.0, 3873.0, 32108.0, 520308.0, 458045.0, 26672.0, 3554.0, 856.0, 352.0, 198.0, 138.0, 106.0, 68.0, 48.0, 32.0, 29.0, 28.0, 17.0, 17.0, 8.0, 5.0, 5.0, 5.0, 1.0, 3.0, 5.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.198486328125, -0.1920795440673828, -0.18567276000976562, -0.17926597595214844, -0.17285919189453125, -0.16645240783691406, -0.16004562377929688, -0.1536388397216797, -0.1472320556640625, -0.1408252716064453, -0.13441848754882812, -0.12801170349121094, -0.12160491943359375, -0.11519813537597656, -0.10879135131835938, -0.10238456726074219, -0.095977783203125, -0.08957099914550781, -0.08316421508789062, -0.07675743103027344, -0.07035064697265625, -0.06394386291503906, -0.057537078857421875, -0.05113029479980469, -0.0447235107421875, -0.03831672668457031, -0.031909942626953125, -0.025503158569335938, -0.01909637451171875, -0.012689590454101562, -0.006282806396484375, 0.0001239776611328125, 0.00653076171875, 0.012937545776367188, 0.019344329833984375, 0.025751113891601562, 0.03215789794921875, 0.03856468200683594, 0.044971466064453125, 0.05137825012207031, 0.0577850341796875, 0.06419181823730469, 0.07059860229492188, 0.07700538635253906, 0.08341217041015625, 0.08981895446777344, 0.09622573852539062, 0.10263252258300781, 0.109039306640625, 0.11544609069824219, 0.12185287475585938, 0.12825965881347656, 0.13466644287109375, 0.14107322692871094, 0.14748001098632812, 0.1538867950439453, 0.1602935791015625, 0.1667003631591797, 0.17310714721679688, 0.17951393127441406, 0.18592071533203125, 0.19232749938964844, 0.19873428344726562, 0.2051410675048828, 0.2115478515625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 4.0, 6.0, 4.0, 6.0, 5.0, 10.0, 7.0, 18.0, 23.0, 13.0, 28.0, 28.0, 46.0, 31.0, 36.0, 34.0, 39.0, 52.0, 35.0, 60.0, 55.0, 42.0, 43.0, 47.0, 51.0, 34.0, 30.0, 28.0, 36.0, 26.0, 28.0, 14.0, 17.0, 13.0, 10.0, 10.0, 4.0, 4.0, 7.0, 4.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.103515625, -2.03765869140625, -1.9718017578125, -1.90594482421875, -1.840087890625, -1.77423095703125, -1.7083740234375, -1.64251708984375, -1.57666015625, -1.51080322265625, -1.4449462890625, -1.37908935546875, -1.313232421875, -1.24737548828125, -1.1815185546875, -1.11566162109375, -1.0498046875, -0.98394775390625, -0.9180908203125, -0.85223388671875, -0.786376953125, -0.72052001953125, -0.6546630859375, -0.58880615234375, -0.52294921875, -0.45709228515625, -0.3912353515625, -0.32537841796875, -0.259521484375, -0.19366455078125, -0.1278076171875, -0.06195068359375, 0.00390625, 0.06976318359375, 0.1356201171875, 0.20147705078125, 0.267333984375, 0.33319091796875, 0.3990478515625, 0.46490478515625, 0.53076171875, 0.59661865234375, 0.6624755859375, 0.72833251953125, 0.794189453125, 0.86004638671875, 0.9259033203125, 0.99176025390625, 1.0576171875, 1.12347412109375, 1.1893310546875, 1.25518798828125, 1.321044921875, 1.38690185546875, 1.4527587890625, 1.51861572265625, 1.58447265625, 1.65032958984375, 1.7161865234375, 1.78204345703125, 1.847900390625, 1.91375732421875, 1.9796142578125, 2.04547119140625, 2.111328125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 8.0, 9.0, 11.0, 17.0, 19.0, 42.0, 78.0, 182.0, 537.0, 3739.0, 1036724.0, 6224.0, 618.0, 149.0, 73.0, 38.0, 16.0, 15.0, 15.0, 10.0, 7.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11407470703125, -0.10943317413330078, -0.10479164123535156, -0.10015010833740234, -0.09550857543945312, -0.0908670425415039, -0.08622550964355469, -0.08158397674560547, -0.07694244384765625, -0.07230091094970703, -0.06765937805175781, -0.0630178451538086, -0.058376312255859375, -0.053734779357910156, -0.04909324645996094, -0.04445171356201172, -0.0398101806640625, -0.03516864776611328, -0.030527114868164062, -0.025885581970214844, -0.021244049072265625, -0.016602516174316406, -0.011960983276367188, -0.007319450378417969, -0.00267791748046875, 0.0019636154174804688, 0.0066051483154296875, 0.011246681213378906, 0.015888214111328125, 0.020529747009277344, 0.025171279907226562, 0.02981281280517578, 0.034454345703125, 0.03909587860107422, 0.04373741149902344, 0.048378944396972656, 0.053020477294921875, 0.057662010192871094, 0.06230354309082031, 0.06694507598876953, 0.07158660888671875, 0.07622814178466797, 0.08086967468261719, 0.0855112075805664, 0.09015274047851562, 0.09479427337646484, 0.09943580627441406, 0.10407733917236328, 0.1087188720703125, 0.11336040496826172, 0.11800193786621094, 0.12264347076416016, 0.12728500366210938, 0.1319265365600586, 0.1365680694580078, 0.14120960235595703, 0.14585113525390625, 0.15049266815185547, 0.1551342010498047, 0.1597757339477539, 0.16441726684570312, 0.16905879974365234, 0.17370033264160156, 0.17834186553955078, 0.1829833984375]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 3.0, 11.0, 12.0, 21.0, 41.0, 56.0, 103.0, 187.0, 182.0, 168.0, 99.0, 49.0, 25.0, 19.0, 8.0, 5.0, 3.0, 5.0, 3.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8789043426513672e-05, -2.7995556592941284e-05, -2.7202069759368896e-05, -2.640858292579651e-05, -2.561509609222412e-05, -2.4821609258651733e-05, -2.4028122425079346e-05, -2.3234635591506958e-05, -2.244114875793457e-05, -2.1647661924362183e-05, -2.0854175090789795e-05, -2.0060688257217407e-05, -1.926720142364502e-05, -1.8473714590072632e-05, -1.7680227756500244e-05, -1.6886740922927856e-05, -1.609325408935547e-05, -1.529976725578308e-05, -1.4506280422210693e-05, -1.3712793588638306e-05, -1.2919306755065918e-05, -1.212581992149353e-05, -1.1332333087921143e-05, -1.0538846254348755e-05, -9.745359420776367e-06, -8.95187258720398e-06, -8.158385753631592e-06, -7.364898920059204e-06, -6.571412086486816e-06, -5.777925252914429e-06, -4.984438419342041e-06, -4.190951585769653e-06, -3.3974647521972656e-06, -2.603977918624878e-06, -1.8104910850524902e-06, -1.0170042514801025e-06, -2.2351741790771484e-07, 5.699694156646729e-07, 1.3634562492370605e-06, 2.1569430828094482e-06, 2.950429916381836e-06, 3.7439167499542236e-06, 4.537403583526611e-06, 5.330890417098999e-06, 6.124377250671387e-06, 6.917864084243774e-06, 7.711350917816162e-06, 8.50483775138855e-06, 9.298324584960938e-06, 1.0091811418533325e-05, 1.0885298252105713e-05, 1.16787850856781e-05, 1.2472271919250488e-05, 1.3265758752822876e-05, 1.4059245586395264e-05, 1.4852732419967651e-05, 1.564621925354004e-05, 1.6439706087112427e-05, 1.7233192920684814e-05, 1.8026679754257202e-05, 1.882016658782959e-05, 1.9613653421401978e-05, 2.0407140254974365e-05, 2.1200627088546753e-05, 2.199411392211914e-05]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 5.0, 8.0, 6.0, 12.0, 14.0, 22.0, 38.0, 73.0, 97.0, 206.0, 330.0, 982.0, 5535.0, 868427.0, 167249.0, 3921.0, 857.0, 324.0, 172.0, 87.0, 48.0, 44.0, 20.0, 24.0, 18.0, 14.0, 15.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.1578369140625, -0.1535625457763672, -0.14928817749023438, -0.14501380920410156, -0.14073944091796875, -0.13646507263183594, -0.13219070434570312, -0.1279163360595703, -0.1236419677734375, -0.11936759948730469, -0.11509323120117188, -0.11081886291503906, -0.10654449462890625, -0.10227012634277344, -0.09799575805664062, -0.09372138977050781, -0.089447021484375, -0.08517265319824219, -0.08089828491210938, -0.07662391662597656, -0.07234954833984375, -0.06807518005371094, -0.06380081176757812, -0.05952644348144531, -0.0552520751953125, -0.05097770690917969, -0.046703338623046875, -0.04242897033691406, -0.03815460205078125, -0.03388023376464844, -0.029605865478515625, -0.025331497192382812, -0.02105712890625, -0.016782760620117188, -0.012508392333984375, -0.008234024047851562, -0.00395965576171875, 0.0003147125244140625, 0.004589080810546875, 0.008863449096679688, 0.0131378173828125, 0.017412185668945312, 0.021686553955078125, 0.025960922241210938, 0.03023529052734375, 0.03450965881347656, 0.038784027099609375, 0.04305839538574219, 0.047332763671875, 0.05160713195800781, 0.055881500244140625, 0.06015586853027344, 0.06443023681640625, 0.06870460510253906, 0.07297897338867188, 0.07725334167480469, 0.0815277099609375, 0.08580207824707031, 0.09007644653320312, 0.09435081481933594, 0.09862518310546875, 0.10289955139160156, 0.10717391967773438, 0.11144828796386719, 0.11572265625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 9.0, 10.0, 57.0, 528.0, 312.0, 44.0, 16.0, 3.0, 5.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0416259765625, -0.040738701820373535, -0.03985142707824707, -0.038964152336120605, -0.03807687759399414, -0.037189602851867676, -0.03630232810974121, -0.035415053367614746, -0.03452777862548828, -0.033640503883361816, -0.03275322914123535, -0.03186595439910889, -0.030978679656982422, -0.030091404914855957, -0.029204130172729492, -0.028316855430603027, -0.027429580688476562, -0.026542305946350098, -0.025655031204223633, -0.024767756462097168, -0.023880481719970703, -0.02299320697784424, -0.022105932235717773, -0.02121865749359131, -0.020331382751464844, -0.01944410800933838, -0.018556833267211914, -0.01766955852508545, -0.016782283782958984, -0.01589500904083252, -0.015007734298706055, -0.01412045955657959, -0.013233184814453125, -0.01234591007232666, -0.011458635330200195, -0.01057136058807373, -0.009684085845947266, -0.0087968111038208, -0.007909536361694336, -0.007022261619567871, -0.006134986877441406, -0.005247712135314941, -0.0043604373931884766, -0.0034731626510620117, -0.002585887908935547, -0.001698613166809082, -0.0008113384246826172, 7.593631744384766e-05, 0.0009632110595703125, 0.0018504858016967773, 0.002737760543823242, 0.003625035285949707, 0.004512310028076172, 0.005399584770202637, 0.0062868595123291016, 0.007174134254455566, 0.008061408996582031, 0.008948683738708496, 0.009835958480834961, 0.010723233222961426, 0.01161050796508789, 0.012497782707214355, 0.01338505744934082, 0.014272332191467285, 0.01515960693359375]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 8.0, 10.0, 21.0, 35.0, 67.0, 144.0, 216.0, 213.0, 146.0, 61.0, 23.0, 15.0, 10.0, 18.0, 2.0, 4.0, 1.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1042208671569824, -3.0072691440582275, -2.9103174209594727, -2.8133656978607178, -2.716413974761963, -2.619462251663208, -2.522510528564453, -2.425558567047119, -2.3286070823669434, -2.2316553592681885, -2.1347036361694336, -2.0377519130706787, -1.9408001899719238, -1.843848466873169, -1.7468966245651245, -1.6499449014663696, -1.5529930591583252, -1.4560413360595703, -1.3590896129608154, -1.2621378898620605, -1.1651861667633057, -1.0682344436645508, -0.9712826013565063, -0.8743308782577515, -0.7773791551589966, -0.6804274320602417, -0.5834757089614868, -0.48652392625808716, -0.3895722031593323, -0.2926204800605774, -0.19566869735717773, -0.09871697425842285, -0.0017652511596679688, 0.09518648684024811, 0.19213822484016418, 0.28908997774124146, 0.38604170083999634, 0.4829934239387512, 0.5799452066421509, 0.6768969297409058, 0.7738486528396606, 0.8708003759384155, 0.9677520990371704, 1.0647039413452148, 1.1616556644439697, 1.2586073875427246, 1.3555591106414795, 1.4525108337402344, 1.5494625568389893, 1.6464142799377441, 1.743366003036499, 1.840317726135254, 1.9372694492340088, 2.0342211723327637, 2.1311731338500977, 2.2281246185302734, 2.3250765800476074, 2.4220283031463623, 2.518980026245117, 2.615931749343872, 2.712883472442627, 2.809835195541382, 2.9067869186401367, 3.0037388801574707, 3.1006903648376465]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 12.0, 12.0, 15.0, 22.0, 28.0, 58.0, 64.0, 88.0, 108.0, 108.0, 99.0, 100.0, 83.0, 64.0, 52.0, 28.0, 16.0, 13.0, 7.0, 7.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5358527898788452, -1.4713879823684692, -1.4069232940673828, -1.3424584865570068, -1.2779936790466309, -1.2135288715362549, -1.1490641832351685, -1.0845993757247925, -1.020134687423706, -0.9556699395179749, -0.8912051320075989, -0.8267403841018677, -0.7622755765914917, -0.6978108286857605, -0.6333460807800293, -0.5688812732696533, -0.5044164657592773, -0.43995168805122375, -0.37548691034317017, -0.31102216243743896, -0.24655738472938538, -0.1820926070213318, -0.11762785911560059, -0.053163081407547, 0.011301696300506592, 0.07576646655797958, 0.14023123681545258, 0.20469599962234497, 0.26916077733039856, 0.33362555503845215, 0.39809030294418335, 0.46255508065223694, 0.5270199775695801, 0.5914847254753113, 0.6559495329856873, 0.7204142808914185, 0.7848790884017944, 0.8493438363075256, 0.9138085842132568, 0.9782733917236328, 1.0427381992340088, 1.1072030067443848, 1.1716676950454712, 1.2361325025558472, 1.3005973100662231, 1.3650619983673096, 1.4295268058776855, 1.4939916133880615, 1.558456301689148, 1.622921109199524, 1.6873857975006104, 1.7518506050109863, 1.8163154125213623, 1.8807802200317383, 1.9452449083328247, 2.009709596633911, 2.074174404144287, 2.138639211654663, 2.203104019165039, 2.267568588256836, 2.332033395767212, 2.396498203277588, 2.460963010787964, 2.52542781829834, 2.589892625808716]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 5.0, 6.0, 6.0, 13.0, 14.0, 22.0, 30.0, 61.0, 101.0, 192.0, 408.0, 970.0, 2563.0, 8018.0, 38611.0, 637087.0, 323312.0, 27308.0, 6223.0, 2036.0, 824.0, 307.0, 203.0, 89.0, 65.0, 28.0, 24.0, 8.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.96533203125, -0.9249496459960938, -0.8845672607421875, -0.8441848754882812, -0.803802490234375, -0.7634201049804688, -0.7230377197265625, -0.6826553344726562, -0.64227294921875, -0.6018905639648438, -0.5615081787109375, -0.5211257934570312, -0.480743408203125, -0.44036102294921875, -0.3999786376953125, -0.35959625244140625, -0.3192138671875, -0.27883148193359375, -0.2384490966796875, -0.19806671142578125, -0.157684326171875, -0.11730194091796875, -0.0769195556640625, -0.03653717041015625, 0.00384521484375, 0.04422760009765625, 0.0846099853515625, 0.12499237060546875, 0.165374755859375, 0.20575714111328125, 0.2461395263671875, 0.28652191162109375, 0.326904296875, 0.36728668212890625, 0.4076690673828125, 0.44805145263671875, 0.488433837890625, 0.5288162231445312, 0.5691986083984375, 0.6095809936523438, 0.64996337890625, 0.6903457641601562, 0.7307281494140625, 0.7711105346679688, 0.811492919921875, 0.8518753051757812, 0.8922576904296875, 0.9326400756835938, 0.9730224609375, 1.0134048461914062, 1.0537872314453125, 1.0941696166992188, 1.134552001953125, 1.1749343872070312, 1.2153167724609375, 1.2556991577148438, 1.29608154296875, 1.3364639282226562, 1.3768463134765625, 1.4172286987304688, 1.457611083984375, 1.4979934692382812, 1.5383758544921875, 1.5787582397460938, 1.619140625]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 7.0, 8.0, 13.0, 14.0, 17.0, 34.0, 40.0, 58.0, 57.0, 88.0, 84.0, 100.0, 91.0, 91.0, 65.0, 63.0, 43.0, 41.0, 26.0, 19.0, 7.0, 3.0, 10.0, 1.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.58203125, -2.46807861328125, -2.3541259765625, -2.24017333984375, -2.126220703125, -2.01226806640625, -1.8983154296875, -1.78436279296875, -1.67041015625, -1.55645751953125, -1.4425048828125, -1.32855224609375, -1.214599609375, -1.10064697265625, -0.9866943359375, -0.87274169921875, -0.7587890625, -0.64483642578125, -0.5308837890625, -0.41693115234375, -0.302978515625, -0.18902587890625, -0.0750732421875, 0.03887939453125, 0.15283203125, 0.26678466796875, 0.3807373046875, 0.49468994140625, 0.608642578125, 0.72259521484375, 0.8365478515625, 0.95050048828125, 1.064453125, 1.17840576171875, 1.2923583984375, 1.40631103515625, 1.520263671875, 1.63421630859375, 1.7481689453125, 1.86212158203125, 1.97607421875, 2.09002685546875, 2.2039794921875, 2.31793212890625, 2.431884765625, 2.54583740234375, 2.6597900390625, 2.77374267578125, 2.8876953125, 3.00164794921875, 3.1156005859375, 3.22955322265625, 3.343505859375, 3.45745849609375, 3.5714111328125, 3.68536376953125, 3.79931640625, 3.91326904296875, 4.0272216796875, 4.14117431640625, 4.255126953125, 4.36907958984375, 4.4830322265625, 4.59698486328125, 4.7109375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 8.0, 7.0, 7.0, 11.0, 14.0, 19.0, 22.0, 33.0, 41.0, 76.0, 91.0, 182.0, 340.0, 1050.0, 8592.0, 942608.0, 91489.0, 2736.0, 602.0, 227.0, 114.0, 73.0, 55.0, 33.0, 22.0, 19.0, 26.0, 10.0, 12.0, 9.0, 6.0, 2.0, 8.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-2.7734375, -2.693695068359375, -2.61395263671875, -2.534210205078125, -2.4544677734375, -2.374725341796875, -2.29498291015625, -2.215240478515625, -2.135498046875, -2.055755615234375, -1.97601318359375, -1.896270751953125, -1.8165283203125, -1.736785888671875, -1.65704345703125, -1.577301025390625, -1.49755859375, -1.417816162109375, -1.33807373046875, -1.258331298828125, -1.1785888671875, -1.098846435546875, -1.01910400390625, -0.939361572265625, -0.859619140625, -0.779876708984375, -0.70013427734375, -0.620391845703125, -0.5406494140625, -0.460906982421875, -0.38116455078125, -0.301422119140625, -0.2216796875, -0.141937255859375, -0.06219482421875, 0.017547607421875, 0.0972900390625, 0.177032470703125, 0.25677490234375, 0.336517333984375, 0.416259765625, 0.496002197265625, 0.57574462890625, 0.655487060546875, 0.7352294921875, 0.814971923828125, 0.89471435546875, 0.974456787109375, 1.05419921875, 1.133941650390625, 1.21368408203125, 1.293426513671875, 1.3731689453125, 1.452911376953125, 1.53265380859375, 1.612396240234375, 1.692138671875, 1.771881103515625, 1.85162353515625, 1.931365966796875, 2.0111083984375, 2.090850830078125, 2.17059326171875, 2.250335693359375, 2.330078125]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 6.0, 14.0, 10.0, 9.0, 7.0, 17.0, 11.0, 32.0, 22.0, 26.0, 40.0, 48.0, 53.0, 52.0, 60.0, 65.0, 54.0, 59.0, 65.0, 46.0, 42.0, 40.0, 40.0, 26.0, 22.0, 29.0, 22.0, 21.0, 13.0, 12.0, 4.0, 4.0, 8.0, 9.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.501953125, -3.401214599609375, -3.30047607421875, -3.199737548828125, -3.0989990234375, -2.998260498046875, -2.89752197265625, -2.796783447265625, -2.696044921875, -2.595306396484375, -2.49456787109375, -2.393829345703125, -2.2930908203125, -2.192352294921875, -2.09161376953125, -1.990875244140625, -1.89013671875, -1.789398193359375, -1.68865966796875, -1.587921142578125, -1.4871826171875, -1.386444091796875, -1.28570556640625, -1.184967041015625, -1.084228515625, -0.983489990234375, -0.88275146484375, -0.782012939453125, -0.6812744140625, -0.580535888671875, -0.47979736328125, -0.379058837890625, -0.2783203125, -0.177581787109375, -0.07684326171875, 0.023895263671875, 0.1246337890625, 0.225372314453125, 0.32611083984375, 0.426849365234375, 0.527587890625, 0.628326416015625, 0.72906494140625, 0.829803466796875, 0.9305419921875, 1.031280517578125, 1.13201904296875, 1.232757568359375, 1.33349609375, 1.434234619140625, 1.53497314453125, 1.635711669921875, 1.7364501953125, 1.837188720703125, 1.93792724609375, 2.038665771484375, 2.139404296875, 2.240142822265625, 2.34088134765625, 2.441619873046875, 2.5423583984375, 2.643096923828125, 2.74383544921875, 2.844573974609375, 2.9453125]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 4.0, 9.0, 10.0, 9.0, 12.0, 30.0, 31.0, 57.0, 130.0, 221.0, 436.0, 1068.0, 3990.0, 28863.0, 876714.0, 122806.0, 10578.0, 2092.0, 739.0, 311.0, 168.0, 80.0, 65.0, 35.0, 35.0, 19.0, 14.0, 5.0, 6.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.83447265625, -0.8129501342773438, -0.7914276123046875, -0.7699050903320312, -0.748382568359375, -0.7268600463867188, -0.7053375244140625, -0.6838150024414062, -0.66229248046875, -0.6407699584960938, -0.6192474365234375, -0.5977249145507812, -0.576202392578125, -0.5546798706054688, -0.5331573486328125, -0.5116348266601562, -0.4901123046875, -0.46858978271484375, -0.4470672607421875, -0.42554473876953125, -0.404022216796875, -0.38249969482421875, -0.3609771728515625, -0.33945465087890625, -0.31793212890625, -0.29640960693359375, -0.2748870849609375, -0.25336456298828125, -0.231842041015625, -0.21031951904296875, -0.1887969970703125, -0.16727447509765625, -0.145751953125, -0.12422943115234375, -0.1027069091796875, -0.08118438720703125, -0.059661865234375, -0.03813934326171875, -0.0166168212890625, 0.00490570068359375, 0.02642822265625, 0.04795074462890625, 0.0694732666015625, 0.09099578857421875, 0.112518310546875, 0.13404083251953125, 0.1555633544921875, 0.17708587646484375, 0.1986083984375, 0.22013092041015625, 0.2416534423828125, 0.26317596435546875, 0.284698486328125, 0.30622100830078125, 0.3277435302734375, 0.34926605224609375, 0.37078857421875, 0.39231109619140625, 0.4138336181640625, 0.43535614013671875, 0.456878662109375, 0.47840118408203125, 0.4999237060546875, 0.5214462280273438, 0.54296875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 7.0, 5.0, 2.0, 7.0, 9.0, 9.0, 21.0, 22.0, 24.0, 30.0, 48.0, 129.0, 324.0, 148.0, 74.0, 40.0, 35.0, 23.0, 13.0, 11.0, 9.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.611513137817383e-05, -7.384642958641052e-05, -7.157772779464722e-05, -6.930902600288391e-05, -6.70403242111206e-05, -6.47716224193573e-05, -6.2502920627594e-05, -6.023421883583069e-05, -5.796551704406738e-05, -5.569681525230408e-05, -5.342811346054077e-05, -5.1159411668777466e-05, -4.889070987701416e-05, -4.6622008085250854e-05, -4.435330629348755e-05, -4.208460450172424e-05, -3.981590270996094e-05, -3.754720091819763e-05, -3.5278499126434326e-05, -3.300979733467102e-05, -3.0741095542907715e-05, -2.847239375114441e-05, -2.6203691959381104e-05, -2.3934990167617798e-05, -2.1666288375854492e-05, -1.9397586584091187e-05, -1.712888479232788e-05, -1.4860183000564575e-05, -1.259148120880127e-05, -1.0322779417037964e-05, -8.054077625274658e-06, -5.7853758335113525e-06, -3.516674041748047e-06, -1.2479722499847412e-06, 1.0207295417785645e-06, 3.28943133354187e-06, 5.558133125305176e-06, 7.826834917068481e-06, 1.0095536708831787e-05, 1.2364238500595093e-05, 1.4632940292358398e-05, 1.6901642084121704e-05, 1.917034387588501e-05, 2.1439045667648315e-05, 2.370774745941162e-05, 2.5976449251174927e-05, 2.8245151042938232e-05, 3.0513852834701538e-05, 3.2782554626464844e-05, 3.505125641822815e-05, 3.7319958209991455e-05, 3.958866000175476e-05, 4.1857361793518066e-05, 4.412606358528137e-05, 4.639476537704468e-05, 4.8663467168807983e-05, 5.093216896057129e-05, 5.3200870752334595e-05, 5.54695725440979e-05, 5.7738274335861206e-05, 6.000697612762451e-05, 6.227567791938782e-05, 6.454437971115112e-05, 6.681308150291443e-05, 6.908178329467773e-05]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 4.0, 4.0, 2.0, 5.0, 4.0, 16.0, 18.0, 19.0, 33.0, 35.0, 56.0, 73.0, 167.0, 285.0, 546.0, 1393.0, 4731.0, 25177.0, 774678.0, 217716.0, 17747.0, 3625.0, 1119.0, 468.0, 245.0, 137.0, 87.0, 52.0, 37.0, 17.0, 20.0, 11.0, 6.0, 8.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.681640625, -0.6609268188476562, -0.6402130126953125, -0.6194992065429688, -0.598785400390625, -0.5780715942382812, -0.5573577880859375, -0.5366439819335938, -0.51593017578125, -0.49521636962890625, -0.4745025634765625, -0.45378875732421875, -0.433074951171875, -0.41236114501953125, -0.3916473388671875, -0.37093353271484375, -0.3502197265625, -0.32950592041015625, -0.3087921142578125, -0.28807830810546875, -0.267364501953125, -0.24665069580078125, -0.2259368896484375, -0.20522308349609375, -0.18450927734375, -0.16379547119140625, -0.1430816650390625, -0.12236785888671875, -0.101654052734375, -0.08094024658203125, -0.0602264404296875, -0.03951263427734375, -0.018798828125, 0.00191497802734375, 0.0226287841796875, 0.04334259033203125, 0.064056396484375, 0.08477020263671875, 0.1054840087890625, 0.12619781494140625, 0.14691162109375, 0.16762542724609375, 0.1883392333984375, 0.20905303955078125, 0.229766845703125, 0.25048065185546875, 0.2711944580078125, 0.29190826416015625, 0.3126220703125, 0.33333587646484375, 0.3540496826171875, 0.37476348876953125, 0.395477294921875, 0.41619110107421875, 0.4369049072265625, 0.45761871337890625, 0.47833251953125, 0.49904632568359375, 0.5197601318359375, 0.5404739379882812, 0.561187744140625, 0.5819015502929688, 0.6026153564453125, 0.6233291625976562, 0.64404296875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 2.0, 2.0, 4.0, 11.0, 4.0, 12.0, 18.0, 21.0, 31.0, 55.0, 95.0, 399.0, 157.0, 61.0, 38.0, 17.0, 20.0, 14.0, 7.0, 10.0, 5.0, 4.0, 2.0, 5.0, 6.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.306396484375, -0.2993812561035156, -0.29236602783203125, -0.2853507995605469, -0.2783355712890625, -0.2713203430175781, -0.26430511474609375, -0.2572898864746094, -0.250274658203125, -0.24325942993164062, -0.23624420166015625, -0.22922897338867188, -0.2222137451171875, -0.21519851684570312, -0.20818328857421875, -0.20116806030273438, -0.19415283203125, -0.18713760375976562, -0.18012237548828125, -0.17310714721679688, -0.1660919189453125, -0.15907669067382812, -0.15206146240234375, -0.14504623413085938, -0.138031005859375, -0.13101577758789062, -0.12400054931640625, -0.11698532104492188, -0.1099700927734375, -0.10295486450195312, -0.09593963623046875, -0.08892440795898438, -0.0819091796875, -0.07489395141601562, -0.06787872314453125, -0.060863494873046875, -0.0538482666015625, -0.046833038330078125, -0.03981781005859375, -0.032802581787109375, -0.025787353515625, -0.018772125244140625, -0.01175689697265625, -0.004741668701171875, 0.0022735595703125, 0.009288787841796875, 0.01630401611328125, 0.023319244384765625, 0.03033447265625, 0.037349700927734375, 0.04436492919921875, 0.051380157470703125, 0.0583953857421875, 0.06541061401367188, 0.07242584228515625, 0.07944107055664062, 0.086456298828125, 0.09347152709960938, 0.10048675537109375, 0.10750198364257812, 0.1145172119140625, 0.12153244018554688, 0.12854766845703125, 0.13556289672851562, 0.142578125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 17.0, 38.0, 187.0, 502.0, 195.0, 45.0, 18.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.789307594299316, -5.288122653961182, -4.786938190460205, -4.28575325012207, -3.7845685482025146, -3.283383846282959, -2.782198905944824, -2.2810142040252686, -1.779829502105713, -1.2786448001861572, -0.777459979057312, -0.2762751579284668, 0.22490954399108887, 0.7260942459106445, 1.2272791862487793, 1.728463888168335, 2.2296485900878906, 2.7308332920074463, 3.232017993927002, 3.7332029342651367, 4.234387397766113, 4.735572338104248, 5.236757278442383, 5.737941741943359, 6.239126682281494, 6.740311622619629, 7.2414960861206055, 7.74268102645874, 8.243865966796875, 8.745050430297852, 9.246234893798828, 9.747420310974121, 10.248603820800781, 10.749788284301758, 11.25097370147705, 11.752158164978027, 12.253342628479004, 12.754528045654297, 13.255712509155273, 13.75689697265625, 14.258081436157227, 14.759265899658203, 15.260451316833496, 15.761635780334473, 16.262821197509766, 16.764005661010742, 17.26519012451172, 17.766374588012695, 18.267559051513672, 18.76874351501465, 19.269927978515625, 19.771114349365234, 20.27229881286621, 20.773483276367188, 21.274667739868164, 21.77585220336914, 22.27703857421875, 22.778223037719727, 23.279407501220703, 23.780593872070312, 24.28177833557129, 24.782962799072266, 25.284147262573242, 25.78533172607422, 26.286516189575195]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 7.0, 5.0, 10.0, 9.0, 15.0, 7.0, 18.0, 22.0, 24.0, 31.0, 43.0, 43.0, 38.0, 42.0, 46.0, 52.0, 44.0, 45.0, 46.0, 54.0, 34.0, 41.0, 45.0, 42.0, 31.0, 31.0, 35.0, 32.0, 20.0, 22.0, 12.0, 13.0, 10.0, 11.0, 0.0, 9.0, 5.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.844492435455322, -4.684164524078369, -4.523837089538574, -4.363509178161621, -4.203181743621826, -4.042853832244873, -3.882526159286499, -3.722198486328125, -3.561870574951172, -3.401542901992798, -3.241215229034424, -3.0808873176574707, -2.9205596446990967, -2.7602319717407227, -2.5999042987823486, -2.4395766258239746, -2.2792489528656006, -2.1189212799072266, -1.958593487739563, -1.798265814781189, -1.6379380226135254, -1.4776103496551514, -1.3172826766967773, -1.1569548845291138, -0.9966272115707397, -0.836299479007721, -0.6759717464447021, -0.5156440734863281, -0.3553163409233093, -0.19498860836029053, -0.034660935401916504, 0.12566685676574707, 0.2859945297241211, 0.4463222622871399, 0.6066499948501587, 0.7669776678085327, 0.9273054003715515, 1.0876331329345703, 1.2479608058929443, 1.408288598060608, 1.568616271018982, 1.728943943977356, 1.8892717361450195, 2.0495994091033936, 2.2099270820617676, 2.3702549934387207, 2.5305824279785156, 2.6909103393554688, 2.8512380123138428, 3.011565685272217, 3.171893358230591, 3.332221031188965, 3.492548942565918, 3.652876615524292, 3.813204288482666, 3.973532199859619, 4.133859634399414, 4.294187545776367, 4.454514980316162, 4.614842891693115, 4.77517032623291, 4.935498237609863, 5.095826148986816, 5.256153583526611, 5.4164814949035645]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 4.0, 2.0, 1.0, 5.0, 15.0, 15.0, 14.0, 17.0, 26.0, 31.0, 44.0, 66.0, 103.0, 172.0, 243.0, 422.0, 953.0, 2078.0, 6010.0, 22741.0, 176040.0, 3697579.0, 250267.0, 26341.0, 6566.0, 2241.0, 952.0, 495.0, 284.0, 161.0, 97.0, 88.0, 37.0, 41.0, 40.0, 24.0, 16.0, 10.0, 7.0, 9.0, 9.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.60546875, -2.52020263671875, -2.4349365234375, -2.34967041015625, -2.264404296875, -2.17913818359375, -2.0938720703125, -2.00860595703125, -1.92333984375, -1.83807373046875, -1.7528076171875, -1.66754150390625, -1.582275390625, -1.49700927734375, -1.4117431640625, -1.32647705078125, -1.2412109375, -1.15594482421875, -1.0706787109375, -0.98541259765625, -0.900146484375, -0.81488037109375, -0.7296142578125, -0.64434814453125, -0.55908203125, -0.47381591796875, -0.3885498046875, -0.30328369140625, -0.218017578125, -0.13275146484375, -0.0474853515625, 0.03778076171875, 0.123046875, 0.20831298828125, 0.2935791015625, 0.37884521484375, 0.464111328125, 0.54937744140625, 0.6346435546875, 0.71990966796875, 0.80517578125, 0.89044189453125, 0.9757080078125, 1.06097412109375, 1.146240234375, 1.23150634765625, 1.3167724609375, 1.40203857421875, 1.4873046875, 1.57257080078125, 1.6578369140625, 1.74310302734375, 1.828369140625, 1.91363525390625, 1.9989013671875, 2.08416748046875, 2.16943359375, 2.25469970703125, 2.3399658203125, 2.42523193359375, 2.510498046875, 2.59576416015625, 2.6810302734375, 2.76629638671875, 2.8515625]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 1.0, 3.0, 8.0, 14.0, 20.0, 24.0, 46.0, 69.0, 85.0, 115.0, 148.0, 107.0, 109.0, 76.0, 56.0, 35.0, 27.0, 19.0, 5.0, 8.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.10546875, -2.02960205078125, -1.9537353515625, -1.87786865234375, -1.802001953125, -1.72613525390625, -1.6502685546875, -1.57440185546875, -1.49853515625, -1.42266845703125, -1.3468017578125, -1.27093505859375, -1.195068359375, -1.11920166015625, -1.0433349609375, -0.96746826171875, -0.8916015625, -0.81573486328125, -0.7398681640625, -0.66400146484375, -0.588134765625, -0.51226806640625, -0.4364013671875, -0.36053466796875, -0.28466796875, -0.20880126953125, -0.1329345703125, -0.05706787109375, 0.018798828125, 0.09466552734375, 0.1705322265625, 0.24639892578125, 0.322265625, 0.39813232421875, 0.4739990234375, 0.54986572265625, 0.625732421875, 0.70159912109375, 0.7774658203125, 0.85333251953125, 0.92919921875, 1.00506591796875, 1.0809326171875, 1.15679931640625, 1.232666015625, 1.30853271484375, 1.3843994140625, 1.46026611328125, 1.5361328125, 1.61199951171875, 1.6878662109375, 1.76373291015625, 1.839599609375, 1.91546630859375, 1.9913330078125, 2.06719970703125, 2.14306640625, 2.21893310546875, 2.2947998046875, 2.37066650390625, 2.446533203125, 2.52239990234375, 2.5982666015625, 2.67413330078125, 2.75]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 7.0, 5.0, 9.0, 8.0, 11.0, 30.0, 52.0, 78.0, 127.0, 242.0, 515.0, 1633.0, 9900.0, 256773.0, 3883314.0, 36226.0, 3615.0, 905.0, 357.0, 175.0, 106.0, 70.0, 44.0, 27.0, 12.0, 15.0, 7.0, 9.0, 10.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.546875, -4.3668212890625, -4.186767578125, -4.0067138671875, -3.82666015625, -3.6466064453125, -3.466552734375, -3.2864990234375, -3.1064453125, -2.9263916015625, -2.746337890625, -2.5662841796875, -2.38623046875, -2.2061767578125, -2.026123046875, -1.8460693359375, -1.666015625, -1.4859619140625, -1.305908203125, -1.1258544921875, -0.94580078125, -0.7657470703125, -0.585693359375, -0.4056396484375, -0.2255859375, -0.0455322265625, 0.134521484375, 0.3145751953125, 0.49462890625, 0.6746826171875, 0.854736328125, 1.0347900390625, 1.21484375, 1.3948974609375, 1.574951171875, 1.7550048828125, 1.93505859375, 2.1151123046875, 2.295166015625, 2.4752197265625, 2.6552734375, 2.8353271484375, 3.015380859375, 3.1954345703125, 3.37548828125, 3.5555419921875, 3.735595703125, 3.9156494140625, 4.095703125, 4.2757568359375, 4.455810546875, 4.6358642578125, 4.81591796875, 4.9959716796875, 5.176025390625, 5.3560791015625, 5.5361328125, 5.7161865234375, 5.896240234375, 6.0762939453125, 6.25634765625, 6.4364013671875, 6.616455078125, 6.7965087890625, 6.9765625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 7.0, 11.0, 22.0, 39.0, 80.0, 85.0, 221.0, 600.0, 1618.0, 769.0, 288.0, 134.0, 86.0, 42.0, 20.0, 17.0, 8.0, 8.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.580078125, -1.543853759765625, -1.50762939453125, -1.471405029296875, -1.4351806640625, -1.398956298828125, -1.36273193359375, -1.326507568359375, -1.290283203125, -1.254058837890625, -1.21783447265625, -1.181610107421875, -1.1453857421875, -1.109161376953125, -1.07293701171875, -1.036712646484375, -1.00048828125, -0.964263916015625, -0.92803955078125, -0.891815185546875, -0.8555908203125, -0.819366455078125, -0.78314208984375, -0.746917724609375, -0.710693359375, -0.674468994140625, -0.63824462890625, -0.602020263671875, -0.5657958984375, -0.529571533203125, -0.49334716796875, -0.457122802734375, -0.4208984375, -0.384674072265625, -0.34844970703125, -0.312225341796875, -0.2760009765625, -0.239776611328125, -0.20355224609375, -0.167327880859375, -0.131103515625, -0.094879150390625, -0.05865478515625, -0.022430419921875, 0.0137939453125, 0.050018310546875, 0.08624267578125, 0.122467041015625, 0.15869140625, 0.194915771484375, 0.23114013671875, 0.267364501953125, 0.3035888671875, 0.339813232421875, 0.37603759765625, 0.412261962890625, 0.448486328125, 0.484710693359375, 0.52093505859375, 0.557159423828125, 0.5933837890625, 0.629608154296875, 0.66583251953125, 0.702056884765625, 0.73828125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 10.0, 4.0, 15.0, 17.0, 27.0, 46.0, 89.0, 114.0, 128.0, 153.0, 118.0, 109.0, 65.0, 33.0, 23.0, 16.0, 8.0, 12.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.197394371032715, -4.085183143615723, -3.9729719161987305, -3.860760450363159, -3.748549222946167, -3.636337995529175, -3.5241265296936035, -3.4119153022766113, -3.299704074859619, -3.187492847442627, -3.0752816200256348, -2.9630701541900635, -2.8508589267730713, -2.738647699356079, -2.626436233520508, -2.5142250061035156, -2.4020137786865234, -2.2898025512695312, -2.177591323852539, -2.0653798580169678, -1.9531686305999756, -1.8409574031829834, -1.7287460565567017, -1.61653470993042, -1.5043234825134277, -1.3921122550964355, -1.2799009084701538, -1.167689561843872, -1.0554783344268799, -0.9432670474052429, -0.831055760383606, -0.718844473361969, -0.6066329479217529, -0.49442166090011597, -0.382210373878479, -0.26999908685684204, -0.15778779983520508, -0.045576512813568115, 0.06663477420806885, 0.1788460612297058, 0.2910573482513428, 0.40326863527297974, 0.5154799222946167, 0.6276912093162537, 0.7399024963378906, 0.8521137833595276, 0.9643250703811646, 1.0765364170074463, 1.1887476444244385, 1.3009588718414307, 1.4131702184677124, 1.5253815650939941, 1.6375927925109863, 1.7498040199279785, 1.8620153665542603, 1.974226713180542, 2.086437940597534, 2.1986491680145264, 2.3108606338500977, 2.42307186126709, 2.535283088684082, 2.647494316101074, 2.7597055435180664, 2.8719170093536377, 2.98412823677063]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 4.0, 16.0, 6.0, 13.0, 19.0, 27.0, 24.0, 33.0, 46.0, 55.0, 52.0, 52.0, 61.0, 75.0, 79.0, 62.0, 70.0, 56.0, 50.0, 26.0, 43.0, 45.0, 23.0, 16.0, 13.0, 13.0, 9.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5341423749923706, -1.4624698162078857, -1.3907971382141113, -1.3191245794296265, -1.2474520206451416, -1.1757793426513672, -1.1041067838668823, -1.0324342250823975, -0.9607616066932678, -0.8890889883041382, -0.8174164295196533, -0.7457438111305237, -0.674071192741394, -0.6023986339569092, -0.5307260155677795, -0.4590534567832947, -0.38738083839416504, -0.3157082498073578, -0.24403564631938934, -0.1723630428314209, -0.10069045424461365, -0.029017865657806396, 0.04265475273132324, 0.1143273115158081, 0.18599992990493774, 0.257672518491745, 0.32934510707855225, 0.4010177254676819, 0.47269031405448914, 0.5443629026412964, 0.616035521030426, 0.6877080798149109, 0.759380578994751, 0.8310531973838806, 0.9027257561683655, 0.9743983745574951, 1.04607093334198, 1.1177434921264648, 1.1894161701202393, 1.2610887289047241, 1.332761287689209, 1.4044338464736938, 1.4761065244674683, 1.5477790832519531, 1.619451642036438, 1.6911242008209229, 1.7627968788146973, 1.8344694375991821, 1.9061421155929565, 1.9778146743774414, 2.049487352371216, 2.1211600303649902, 2.1928324699401855, 2.26450514793396, 2.3361778259277344, 2.4078502655029297, 2.479522943496704, 2.5511956214904785, 2.622868061065674, 2.6945407390594482, 2.7662134170532227, 2.837885856628418, 2.9095585346221924, 2.981231212615967, 3.052903652191162]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 3.0, 2.0, 7.0, 7.0, 7.0, 11.0, 8.0, 28.0, 42.0, 51.0, 86.0, 118.0, 178.0, 358.0, 654.0, 1396.0, 4644.0, 45974.0, 868781.0, 115027.0, 7473.0, 1882.0, 745.0, 435.0, 239.0, 126.0, 99.0, 66.0, 49.0, 21.0, 16.0, 3.0, 7.0, 4.0, 7.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.4521484375, -0.43829345703125, -0.4244384765625, -0.41058349609375, -0.396728515625, -0.38287353515625, -0.3690185546875, -0.35516357421875, -0.34130859375, -0.32745361328125, -0.3135986328125, -0.29974365234375, -0.285888671875, -0.27203369140625, -0.2581787109375, -0.24432373046875, -0.23046875, -0.21661376953125, -0.2027587890625, -0.18890380859375, -0.175048828125, -0.16119384765625, -0.1473388671875, -0.13348388671875, -0.11962890625, -0.10577392578125, -0.0919189453125, -0.07806396484375, -0.064208984375, -0.05035400390625, -0.0364990234375, -0.02264404296875, -0.0087890625, 0.00506591796875, 0.0189208984375, 0.03277587890625, 0.046630859375, 0.06048583984375, 0.0743408203125, 0.08819580078125, 0.10205078125, 0.11590576171875, 0.1297607421875, 0.14361572265625, 0.157470703125, 0.17132568359375, 0.1851806640625, 0.19903564453125, 0.212890625, 0.22674560546875, 0.2406005859375, 0.25445556640625, 0.268310546875, 0.28216552734375, 0.2960205078125, 0.30987548828125, 0.32373046875, 0.33758544921875, 0.3514404296875, 0.36529541015625, 0.379150390625, 0.39300537109375, 0.4068603515625, 0.42071533203125, 0.4345703125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 8.0, 14.0, 10.0, 15.0, 15.0, 26.0, 41.0, 39.0, 49.0, 55.0, 73.0, 73.0, 65.0, 68.0, 76.0, 64.0, 69.0, 53.0, 44.0, 35.0, 34.0, 18.0, 15.0, 12.0, 8.0, 9.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4208984375, -1.3621063232421875, -1.303314208984375, -1.2445220947265625, -1.18572998046875, -1.1269378662109375, -1.068145751953125, -1.0093536376953125, -0.9505615234375, -0.8917694091796875, -0.832977294921875, -0.7741851806640625, -0.71539306640625, -0.6566009521484375, -0.597808837890625, -0.5390167236328125, -0.480224609375, -0.4214324951171875, -0.362640380859375, -0.3038482666015625, -0.24505615234375, -0.1862640380859375, -0.127471923828125, -0.0686798095703125, -0.0098876953125, 0.0489044189453125, 0.107696533203125, 0.1664886474609375, 0.22528076171875, 0.2840728759765625, 0.342864990234375, 0.4016571044921875, 0.46044921875, 0.5192413330078125, 0.578033447265625, 0.6368255615234375, 0.69561767578125, 0.7544097900390625, 0.813201904296875, 0.8719940185546875, 0.9307861328125, 0.9895782470703125, 1.048370361328125, 1.1071624755859375, 1.16595458984375, 1.2247467041015625, 1.283538818359375, 1.3423309326171875, 1.401123046875, 1.4599151611328125, 1.518707275390625, 1.5774993896484375, 1.63629150390625, 1.6950836181640625, 1.753875732421875, 1.8126678466796875, 1.8714599609375, 1.9302520751953125, 1.989044189453125, 2.0478363037109375, 2.10662841796875, 2.1654205322265625, 2.224212646484375, 2.2830047607421875, 2.341796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 5.0, 8.0, 5.0, 11.0, 12.0, 23.0, 22.0, 31.0, 53.0, 64.0, 74.0, 100.0, 157.0, 268.0, 445.0, 984.0, 3913.0, 30603.0, 445018.0, 523953.0, 35686.0, 4715.0, 1091.0, 402.0, 264.0, 172.0, 125.0, 94.0, 69.0, 37.0, 23.0, 24.0, 19.0, 12.0, 15.0, 12.0, 7.0, 5.0, 6.0, 3.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.237060546875, -0.2296600341796875, -0.222259521484375, -0.2148590087890625, -0.20745849609375, -0.2000579833984375, -0.192657470703125, -0.1852569580078125, -0.1778564453125, -0.1704559326171875, -0.163055419921875, -0.1556549072265625, -0.14825439453125, -0.1408538818359375, -0.133453369140625, -0.1260528564453125, -0.11865234375, -0.1112518310546875, -0.103851318359375, -0.0964508056640625, -0.08905029296875, -0.0816497802734375, -0.074249267578125, -0.0668487548828125, -0.0594482421875, -0.0520477294921875, -0.044647216796875, -0.0372467041015625, -0.02984619140625, -0.0224456787109375, -0.015045166015625, -0.0076446533203125, -0.000244140625, 0.0071563720703125, 0.014556884765625, 0.0219573974609375, 0.02935791015625, 0.0367584228515625, 0.044158935546875, 0.0515594482421875, 0.0589599609375, 0.0663604736328125, 0.073760986328125, 0.0811614990234375, 0.08856201171875, 0.0959625244140625, 0.103363037109375, 0.1107635498046875, 0.1181640625, 0.1255645751953125, 0.132965087890625, 0.1403656005859375, 0.14776611328125, 0.1551666259765625, 0.162567138671875, 0.1699676513671875, 0.1773681640625, 0.1847686767578125, 0.192169189453125, 0.1995697021484375, 0.20697021484375, 0.2143707275390625, 0.221771240234375, 0.2291717529296875, 0.236572265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 6.0, 5.0, 3.0, 17.0, 14.0, 10.0, 23.0, 23.0, 20.0, 29.0, 27.0, 27.0, 31.0, 37.0, 37.0, 45.0, 45.0, 35.0, 50.0, 43.0, 42.0, 49.0, 33.0, 36.0, 48.0, 42.0, 29.0, 26.0, 20.0, 19.0, 23.0, 19.0, 9.0, 9.0, 11.0, 4.0, 13.0, 5.0, 8.0, 6.0, 8.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.32421875, -2.24969482421875, -2.1751708984375, -2.10064697265625, -2.026123046875, -1.95159912109375, -1.8770751953125, -1.80255126953125, -1.72802734375, -1.65350341796875, -1.5789794921875, -1.50445556640625, -1.429931640625, -1.35540771484375, -1.2808837890625, -1.20635986328125, -1.1318359375, -1.05731201171875, -0.9827880859375, -0.90826416015625, -0.833740234375, -0.75921630859375, -0.6846923828125, -0.61016845703125, -0.53564453125, -0.46112060546875, -0.3865966796875, -0.31207275390625, -0.237548828125, -0.16302490234375, -0.0885009765625, -0.01397705078125, 0.060546875, 0.13507080078125, 0.2095947265625, 0.28411865234375, 0.358642578125, 0.43316650390625, 0.5076904296875, 0.58221435546875, 0.65673828125, 0.73126220703125, 0.8057861328125, 0.88031005859375, 0.954833984375, 1.02935791015625, 1.1038818359375, 1.17840576171875, 1.2529296875, 1.32745361328125, 1.4019775390625, 1.47650146484375, 1.551025390625, 1.62554931640625, 1.7000732421875, 1.77459716796875, 1.84912109375, 1.92364501953125, 1.9981689453125, 2.07269287109375, 2.147216796875, 2.22174072265625, 2.2962646484375, 2.37078857421875, 2.4453125]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 5.0, 0.0, 1.0, 4.0, 2.0, 4.0, 5.0, 9.0, 10.0, 17.0, 22.0, 47.0, 54.0, 79.0, 144.0, 251.0, 587.0, 2457.0, 745711.0, 295746.0, 2235.0, 550.0, 245.0, 132.0, 84.0, 47.0, 41.0, 25.0, 16.0, 8.0, 11.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.093505859375, -0.09075260162353516, -0.08799934387207031, -0.08524608612060547, -0.08249282836914062, -0.07973957061767578, -0.07698631286621094, -0.0742330551147461, -0.07147979736328125, -0.0687265396118164, -0.06597328186035156, -0.06322002410888672, -0.060466766357421875, -0.05771350860595703, -0.05496025085449219, -0.052206993103027344, -0.0494537353515625, -0.046700477600097656, -0.04394721984863281, -0.04119396209716797, -0.038440704345703125, -0.03568744659423828, -0.03293418884277344, -0.030180931091308594, -0.02742767333984375, -0.024674415588378906, -0.021921157836914062, -0.01916790008544922, -0.016414642333984375, -0.013661384582519531, -0.010908126831054688, -0.008154869079589844, -0.005401611328125, -0.0026483535766601562, 0.0001049041748046875, 0.0028581619262695312, 0.005611419677734375, 0.008364677429199219, 0.011117935180664062, 0.013871192932128906, 0.01662445068359375, 0.019377708435058594, 0.022130966186523438, 0.02488422393798828, 0.027637481689453125, 0.03039073944091797, 0.03314399719238281, 0.035897254943847656, 0.0386505126953125, 0.041403770446777344, 0.04415702819824219, 0.04691028594970703, 0.049663543701171875, 0.05241680145263672, 0.05517005920410156, 0.057923316955566406, 0.06067657470703125, 0.0634298324584961, 0.06618309020996094, 0.06893634796142578, 0.07168960571289062, 0.07444286346435547, 0.07719612121582031, 0.07994937896728516, 0.08270263671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 6.0, 5.0, 11.0, 13.0, 4.0, 18.0, 21.0, 32.0, 31.0, 55.0, 48.0, 80.0, 83.0, 84.0, 85.0, 72.0, 74.0, 48.0, 54.0, 33.0, 35.0, 24.0, 16.0, 14.0, 8.0, 9.0, 8.0, 3.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.609325408935547e-05, -1.5635043382644653e-05, -1.5176832675933838e-05, -1.4718621969223022e-05, -1.4260411262512207e-05, -1.3802200555801392e-05, -1.3343989849090576e-05, -1.288577914237976e-05, -1.2427568435668945e-05, -1.196935772895813e-05, -1.1511147022247314e-05, -1.1052936315536499e-05, -1.0594725608825684e-05, -1.0136514902114868e-05, -9.678304195404053e-06, -9.220093488693237e-06, -8.761882781982422e-06, -8.303672075271606e-06, -7.845461368560791e-06, -7.387250661849976e-06, -6.92903995513916e-06, -6.470829248428345e-06, -6.012618541717529e-06, -5.554407835006714e-06, -5.0961971282958984e-06, -4.637986421585083e-06, -4.179775714874268e-06, -3.721565008163452e-06, -3.2633543014526367e-06, -2.8051435947418213e-06, -2.346932888031006e-06, -1.8887221813201904e-06, -1.430511474609375e-06, -9.723007678985596e-07, -5.140900611877441e-07, -5.587935447692871e-08, 4.023313522338867e-07, 8.605420589447021e-07, 1.3187527656555176e-06, 1.776963472366333e-06, 2.2351741790771484e-06, 2.693384885787964e-06, 3.1515955924987793e-06, 3.6098062992095947e-06, 4.06801700592041e-06, 4.526227712631226e-06, 4.984438419342041e-06, 5.4426491260528564e-06, 5.900859832763672e-06, 6.359070539474487e-06, 6.817281246185303e-06, 7.275491952896118e-06, 7.733702659606934e-06, 8.191913366317749e-06, 8.650124073028564e-06, 9.10833477973938e-06, 9.566545486450195e-06, 1.002475619316101e-05, 1.0482966899871826e-05, 1.0941177606582642e-05, 1.1399388313293457e-05, 1.1857599020004272e-05, 1.2315809726715088e-05, 1.2774020433425903e-05, 1.3232231140136719e-05]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 0.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 6.0, 10.0, 15.0, 21.0, 32.0, 45.0, 95.0, 168.0, 268.0, 528.0, 1244.0, 3449.0, 14183.0, 154093.0, 834176.0, 30694.0, 5986.0, 1862.0, 778.0, 377.0, 207.0, 113.0, 71.0, 33.0, 27.0, 18.0, 8.0, 9.0, 4.0, 7.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.08416748046875, -0.08190536499023438, -0.07964324951171875, -0.07738113403320312, -0.0751190185546875, -0.07285690307617188, -0.07059478759765625, -0.06833267211914062, -0.066070556640625, -0.06380844116210938, -0.06154632568359375, -0.059284210205078125, -0.0570220947265625, -0.054759979248046875, -0.05249786376953125, -0.050235748291015625, -0.0479736328125, -0.045711517333984375, -0.04344940185546875, -0.041187286376953125, -0.0389251708984375, -0.036663055419921875, -0.03440093994140625, -0.032138824462890625, -0.029876708984375, -0.027614593505859375, -0.02535247802734375, -0.023090362548828125, -0.0208282470703125, -0.018566131591796875, -0.01630401611328125, -0.014041900634765625, -0.01177978515625, -0.009517669677734375, -0.00725555419921875, -0.004993438720703125, -0.0027313232421875, -0.000469207763671875, 0.00179290771484375, 0.004055023193359375, 0.006317138671875, 0.008579254150390625, 0.01084136962890625, 0.013103485107421875, 0.0153656005859375, 0.017627716064453125, 0.01988983154296875, 0.022151947021484375, 0.0244140625, 0.026676177978515625, 0.02893829345703125, 0.031200408935546875, 0.0334625244140625, 0.035724639892578125, 0.03798675537109375, 0.040248870849609375, 0.042510986328125, 0.044773101806640625, 0.04703521728515625, 0.049297332763671875, 0.0515594482421875, 0.053821563720703125, 0.05608367919921875, 0.058345794677734375, 0.06060791015625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 4.0, 9.0, 16.0, 25.0, 44.0, 95.0, 302.0, 284.0, 76.0, 45.0, 22.0, 14.0, 17.0, 9.0, 7.0, 4.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.018341064453125, -0.017661094665527344, -0.016981124877929688, -0.01630115509033203, -0.015621185302734375, -0.014941215515136719, -0.014261245727539062, -0.013581275939941406, -0.01290130615234375, -0.012221336364746094, -0.011541366577148438, -0.010861396789550781, -0.010181427001953125, -0.009501457214355469, -0.008821487426757812, -0.008141517639160156, -0.0074615478515625, -0.006781578063964844, -0.0061016082763671875, -0.005421638488769531, -0.004741668701171875, -0.004061698913574219, -0.0033817291259765625, -0.0027017593383789062, -0.00202178955078125, -0.0013418197631835938, -0.0006618499755859375, 1.811981201171875e-05, 0.000698089599609375, 0.0013780593872070312, 0.0020580291748046875, 0.0027379989624023438, 0.00341796875, 0.004097938537597656, 0.0047779083251953125, 0.005457878112792969, 0.006137847900390625, 0.006817817687988281, 0.0074977874755859375, 0.008177757263183594, 0.00885772705078125, 0.009537696838378906, 0.010217666625976562, 0.010897636413574219, 0.011577606201171875, 0.012257575988769531, 0.012937545776367188, 0.013617515563964844, 0.0142974853515625, 0.014977455139160156, 0.015657424926757812, 0.01633739471435547, 0.017017364501953125, 0.01769733428955078, 0.018377304077148438, 0.019057273864746094, 0.01973724365234375, 0.020417213439941406, 0.021097183227539062, 0.02177715301513672, 0.022457122802734375, 0.02313709259033203, 0.023817062377929688, 0.024497032165527344, 0.025177001953125]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 11.0, 10.0, 26.0, 40.0, 90.0, 160.0, 200.0, 183.0, 150.0, 65.0, 29.0, 15.0, 14.0, 4.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3721532821655273, -3.2513275146484375, -3.1305019855499268, -3.009676218032837, -2.888850450515747, -2.7680249214172363, -2.6471991539001465, -2.5263733863830566, -2.405547618865967, -2.284721851348877, -2.163896322250366, -2.0430705547332764, -1.9222447872161865, -1.8014191389083862, -1.680593490600586, -1.559767723083496, -1.4389420747756958, -1.3181164264678955, -1.1972906589508057, -1.0764650106430054, -0.9556392431259155, -0.8348135948181152, -0.7139878869056702, -0.5931621789932251, -0.47233647108078003, -0.35151076316833496, -0.2306850701570511, -0.10985937714576721, 0.010966330766677856, 0.13179200887680054, 0.2526177167892456, 0.3734434247016907, 0.49426913261413574, 0.6150948405265808, 0.7359205484390259, 0.8567461967468262, 0.977571964263916, 1.0983976125717163, 1.2192232608795166, 1.3400490283966064, 1.4608747959136963, 1.5817004442214966, 1.7025262117385864, 1.8233518600463867, 1.9441776275634766, 2.0650033950805664, 2.185828924179077, 2.306654691696167, 2.4274802207946777, 2.5483059883117676, 2.6691315174102783, 2.789957284927368, 2.910783052444458, 3.0316085815429688, 3.1524343490600586, 3.2732601165771484, 3.3940858840942383, 3.514911651611328, 3.635737180709839, 3.7565629482269287, 3.8773887157440186, 3.9982142448425293, 4.119040012359619, 4.239865779876709, 4.360691547393799]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 7.0, 8.0, 11.0, 10.0, 19.0, 25.0, 31.0, 42.0, 43.0, 71.0, 59.0, 73.0, 80.0, 89.0, 78.0, 66.0, 68.0, 46.0, 42.0, 41.0, 28.0, 19.0, 16.0, 10.0, 6.0, 5.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2674089670181274, -1.2077746391296387, -1.1481401920318604, -1.0885058641433716, -1.0288715362548828, -0.969237208366394, -0.9096028208732605, -0.849968433380127, -0.7903341054916382, -0.7306997776031494, -0.6710653901100159, -0.6114310026168823, -0.5517966747283936, -0.4921623170375824, -0.43252795934677124, -0.3728936016559601, -0.3132592439651489, -0.25362488627433777, -0.1939905285835266, -0.13435617089271545, -0.0747218132019043, -0.01508745551109314, 0.04454690217971802, 0.10418125987052917, 0.16381561756134033, 0.2234499752521515, 0.28308433294296265, 0.3427186906337738, 0.40235304832458496, 0.4619874060153961, 0.5216217637062073, 0.5812561511993408, 0.64089035987854, 0.7005246877670288, 0.7601590752601624, 0.8197934627532959, 0.8794277906417847, 0.9390621185302734, 0.998696506023407, 1.0583308935165405, 1.1179652214050293, 1.177599549293518, 1.2372338771820068, 1.2968683242797852, 1.356502652168274, 1.4161369800567627, 1.475771427154541, 1.5354057550430298, 1.5950400829315186, 1.6546744108200073, 1.714308738708496, 1.7739431858062744, 1.8335775136947632, 1.893211841583252, 1.9528462886810303, 2.0124804973602295, 2.072114944458008, 2.131749391555786, 2.1913836002349854, 2.2510180473327637, 2.310652256011963, 2.370286703109741, 2.4299211502075195, 2.4895553588867188, 2.549189805984497]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 12.0, 12.0, 16.0, 27.0, 39.0, 59.0, 104.0, 189.0, 332.0, 623.0, 1203.0, 2634.0, 6313.0, 18643.0, 78836.0, 616603.0, 261881.0, 41115.0, 11555.0, 4319.0, 1895.0, 972.0, 513.0, 234.0, 160.0, 89.0, 52.0, 34.0, 24.0, 13.0, 19.0, 8.0, 7.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2578125, -1.21087646484375, -1.1639404296875, -1.11700439453125, -1.070068359375, -1.02313232421875, -0.9761962890625, -0.92926025390625, -0.88232421875, -0.83538818359375, -0.7884521484375, -0.74151611328125, -0.694580078125, -0.64764404296875, -0.6007080078125, -0.55377197265625, -0.5068359375, -0.45989990234375, -0.4129638671875, -0.36602783203125, -0.319091796875, -0.27215576171875, -0.2252197265625, -0.17828369140625, -0.13134765625, -0.08441162109375, -0.0374755859375, 0.00946044921875, 0.056396484375, 0.10333251953125, 0.1502685546875, 0.19720458984375, 0.244140625, 0.29107666015625, 0.3380126953125, 0.38494873046875, 0.431884765625, 0.47882080078125, 0.5257568359375, 0.57269287109375, 0.61962890625, 0.66656494140625, 0.7135009765625, 0.76043701171875, 0.807373046875, 0.85430908203125, 0.9012451171875, 0.94818115234375, 0.9951171875, 1.04205322265625, 1.0889892578125, 1.13592529296875, 1.182861328125, 1.22979736328125, 1.2767333984375, 1.32366943359375, 1.37060546875, 1.41754150390625, 1.4644775390625, 1.51141357421875, 1.558349609375, 1.60528564453125, 1.6522216796875, 1.69915771484375, 1.74609375]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 6.0, 7.0, 13.0, 14.0, 22.0, 35.0, 45.0, 49.0, 49.0, 57.0, 80.0, 82.0, 82.0, 80.0, 85.0, 45.0, 63.0, 49.0, 32.0, 23.0, 18.0, 15.0, 15.0, 9.0, 7.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.76953125, -2.65142822265625, -2.5333251953125, -2.41522216796875, -2.297119140625, -2.17901611328125, -2.0609130859375, -1.94281005859375, -1.82470703125, -1.70660400390625, -1.5885009765625, -1.47039794921875, -1.352294921875, -1.23419189453125, -1.1160888671875, -0.99798583984375, -0.8798828125, -0.76177978515625, -0.6436767578125, -0.52557373046875, -0.407470703125, -0.28936767578125, -0.1712646484375, -0.05316162109375, 0.06494140625, 0.18304443359375, 0.3011474609375, 0.41925048828125, 0.537353515625, 0.65545654296875, 0.7735595703125, 0.89166259765625, 1.009765625, 1.12786865234375, 1.2459716796875, 1.36407470703125, 1.482177734375, 1.60028076171875, 1.7183837890625, 1.83648681640625, 1.95458984375, 2.07269287109375, 2.1907958984375, 2.30889892578125, 2.427001953125, 2.54510498046875, 2.6632080078125, 2.78131103515625, 2.8994140625, 3.01751708984375, 3.1356201171875, 3.25372314453125, 3.371826171875, 3.48992919921875, 3.6080322265625, 3.72613525390625, 3.84423828125, 3.96234130859375, 4.0804443359375, 4.19854736328125, 4.316650390625, 4.43475341796875, 4.5528564453125, 4.67095947265625, 4.7890625]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 11.0, 7.0, 7.0, 10.0, 22.0, 14.0, 29.0, 27.0, 36.0, 48.0, 72.0, 100.0, 175.0, 359.0, 1380.0, 14634.0, 929708.0, 96949.0, 3598.0, 639.0, 215.0, 157.0, 96.0, 57.0, 47.0, 31.0, 25.0, 22.0, 19.0, 10.0, 11.0, 7.0, 3.0, 8.0, 5.0, 0.0, 4.0, 3.0, 3.0, 1.0, 4.0, 2.0], "bins": [-5.64453125, -5.49884033203125, -5.3531494140625, -5.20745849609375, -5.061767578125, -4.91607666015625, -4.7703857421875, -4.62469482421875, -4.47900390625, -4.33331298828125, -4.1876220703125, -4.04193115234375, -3.896240234375, -3.75054931640625, -3.6048583984375, -3.45916748046875, -3.3134765625, -3.16778564453125, -3.0220947265625, -2.87640380859375, -2.730712890625, -2.58502197265625, -2.4393310546875, -2.29364013671875, -2.14794921875, -2.00225830078125, -1.8565673828125, -1.71087646484375, -1.565185546875, -1.41949462890625, -1.2738037109375, -1.12811279296875, -0.982421875, -0.83673095703125, -0.6910400390625, -0.54534912109375, -0.399658203125, -0.25396728515625, -0.1082763671875, 0.03741455078125, 0.18310546875, 0.32879638671875, 0.4744873046875, 0.62017822265625, 0.765869140625, 0.91156005859375, 1.0572509765625, 1.20294189453125, 1.3486328125, 1.49432373046875, 1.6400146484375, 1.78570556640625, 1.931396484375, 2.07708740234375, 2.2227783203125, 2.36846923828125, 2.51416015625, 2.65985107421875, 2.8055419921875, 2.95123291015625, 3.096923828125, 3.24261474609375, 3.3883056640625, 3.53399658203125, 3.6796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 3.0, 5.0, 6.0, 8.0, 9.0, 11.0, 9.0, 16.0, 24.0, 24.0, 19.0, 23.0, 36.0, 40.0, 39.0, 48.0, 47.0, 42.0, 49.0, 59.0, 36.0, 51.0, 57.0, 39.0, 32.0, 38.0, 32.0, 35.0, 19.0, 19.0, 27.0, 18.0, 15.0, 16.0, 7.0, 8.0, 4.0, 3.0, 7.0, 5.0, 3.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0], "bins": [-3.86328125, -3.758331298828125, -3.65338134765625, -3.548431396484375, -3.4434814453125, -3.338531494140625, -3.23358154296875, -3.128631591796875, -3.023681640625, -2.918731689453125, -2.81378173828125, -2.708831787109375, -2.6038818359375, -2.498931884765625, -2.39398193359375, -2.289031982421875, -2.18408203125, -2.079132080078125, -1.97418212890625, -1.869232177734375, -1.7642822265625, -1.659332275390625, -1.55438232421875, -1.449432373046875, -1.344482421875, -1.239532470703125, -1.13458251953125, -1.029632568359375, -0.9246826171875, -0.819732666015625, -0.71478271484375, -0.609832763671875, -0.5048828125, -0.399932861328125, -0.29498291015625, -0.190032958984375, -0.0850830078125, 0.019866943359375, 0.12481689453125, 0.229766845703125, 0.334716796875, 0.439666748046875, 0.54461669921875, 0.649566650390625, 0.7545166015625, 0.859466552734375, 0.96441650390625, 1.069366455078125, 1.17431640625, 1.279266357421875, 1.38421630859375, 1.489166259765625, 1.5941162109375, 1.699066162109375, 1.80401611328125, 1.908966064453125, 2.013916015625, 2.118865966796875, 2.22381591796875, 2.328765869140625, 2.4337158203125, 2.538665771484375, 2.64361572265625, 2.748565673828125, 2.853515625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 2.0, 5.0, 5.0, 6.0, 7.0, 9.0, 13.0, 15.0, 21.0, 31.0, 48.0, 66.0, 120.0, 199.0, 390.0, 1222.0, 5085.0, 35100.0, 727144.0, 254676.0, 19467.0, 3258.0, 844.0, 357.0, 179.0, 95.0, 47.0, 35.0, 27.0, 20.0, 14.0, 14.0, 5.0, 5.0, 5.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.0439453125, -1.0139999389648438, -0.9840545654296875, -0.9541091918945312, -0.924163818359375, -0.8942184448242188, -0.8642730712890625, -0.8343276977539062, -0.80438232421875, -0.7744369506835938, -0.7444915771484375, -0.7145462036132812, -0.684600830078125, -0.6546554565429688, -0.6247100830078125, -0.5947647094726562, -0.5648193359375, -0.5348739624023438, -0.5049285888671875, -0.47498321533203125, -0.445037841796875, -0.41509246826171875, -0.3851470947265625, -0.35520172119140625, -0.32525634765625, -0.29531097412109375, -0.2653656005859375, -0.23542022705078125, -0.205474853515625, -0.17552947998046875, -0.1455841064453125, -0.11563873291015625, -0.085693359375, -0.05574798583984375, -0.0258026123046875, 0.00414276123046875, 0.034088134765625, 0.06403350830078125, 0.0939788818359375, 0.12392425537109375, 0.15386962890625, 0.18381500244140625, 0.2137603759765625, 0.24370574951171875, 0.273651123046875, 0.30359649658203125, 0.3335418701171875, 0.36348724365234375, 0.3934326171875, 0.42337799072265625, 0.4533233642578125, 0.48326873779296875, 0.513214111328125, 0.5431594848632812, 0.5731048583984375, 0.6030502319335938, 0.63299560546875, 0.6629409790039062, 0.6928863525390625, 0.7228317260742188, 0.752777099609375, 0.7827224731445312, 0.8126678466796875, 0.8426132202148438, 0.87255859375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 5.0, 16.0, 19.0, 27.0, 49.0, 112.0, 344.0, 235.0, 98.0, 38.0, 27.0, 14.0, 10.0, 7.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002760887145996094, -0.00026978179812431335, -0.00026347488164901733, -0.0002571679651737213, -0.0002508610486984253, -0.00024455413222312927, -0.00023824721574783325, -0.00023194029927253723, -0.0002256333827972412, -0.0002193264663219452, -0.00021301954984664917, -0.00020671263337135315, -0.00020040571689605713, -0.0001940988004207611, -0.0001877918839454651, -0.00018148496747016907, -0.00017517805099487305, -0.00016887113451957703, -0.000162564218044281, -0.00015625730156898499, -0.00014995038509368896, -0.00014364346861839294, -0.00013733655214309692, -0.0001310296356678009, -0.00012472271919250488, -0.00011841580271720886, -0.00011210888624191284, -0.00010580196976661682, -9.94950532913208e-05, -9.318813681602478e-05, -8.688122034072876e-05, -8.057430386543274e-05, -7.426738739013672e-05, -6.79604709148407e-05, -6.165355443954468e-05, -5.534663796424866e-05, -4.903972148895264e-05, -4.2732805013656616e-05, -3.6425888538360596e-05, -3.0118972063064575e-05, -2.3812055587768555e-05, -1.7505139112472534e-05, -1.1198222637176514e-05, -4.891306161880493e-06, 1.4156103134155273e-06, 7.722526788711548e-06, 1.4029443264007568e-05, 2.033635973930359e-05, 2.664327621459961e-05, 3.295019268989563e-05, 3.925710916519165e-05, 4.556402564048767e-05, 5.187094211578369e-05, 5.817785859107971e-05, 6.448477506637573e-05, 7.079169154167175e-05, 7.709860801696777e-05, 8.34055244922638e-05, 8.971244096755981e-05, 9.601935744285583e-05, 0.00010232627391815186, 0.00010863319039344788, 0.0001149401068687439, 0.00012124702334403992, 0.00012755393981933594]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 5.0, 10.0, 10.0, 4.0, 17.0, 28.0, 26.0, 51.0, 74.0, 127.0, 210.0, 384.0, 865.0, 2052.0, 5369.0, 16789.0, 67644.0, 608188.0, 282141.0, 45135.0, 12299.0, 4038.0, 1563.0, 693.0, 345.0, 197.0, 91.0, 66.0, 41.0, 27.0, 25.0, 10.0, 12.0, 1.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.53173828125, -0.5126571655273438, -0.4935760498046875, -0.47449493408203125, -0.455413818359375, -0.43633270263671875, -0.4172515869140625, -0.39817047119140625, -0.37908935546875, -0.36000823974609375, -0.3409271240234375, -0.32184600830078125, -0.302764892578125, -0.28368377685546875, -0.2646026611328125, -0.24552154541015625, -0.2264404296875, -0.20735931396484375, -0.1882781982421875, -0.16919708251953125, -0.150115966796875, -0.13103485107421875, -0.1119537353515625, -0.09287261962890625, -0.07379150390625, -0.05471038818359375, -0.0356292724609375, -0.01654815673828125, 0.002532958984375, 0.02161407470703125, 0.0406951904296875, 0.05977630615234375, 0.078857421875, 0.09793853759765625, 0.1170196533203125, 0.13610076904296875, 0.155181884765625, 0.17426300048828125, 0.1933441162109375, 0.21242523193359375, 0.23150634765625, 0.25058746337890625, 0.2696685791015625, 0.28874969482421875, 0.307830810546875, 0.32691192626953125, 0.3459930419921875, 0.36507415771484375, 0.3841552734375, 0.40323638916015625, 0.4223175048828125, 0.44139862060546875, 0.460479736328125, 0.47956085205078125, 0.4986419677734375, 0.5177230834960938, 0.53680419921875, 0.5558853149414062, 0.5749664306640625, 0.5940475463867188, 0.613128662109375, 0.6322097778320312, 0.6512908935546875, 0.6703720092773438, 0.689453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 6.0, 5.0, 5.0, 6.0, 13.0, 15.0, 25.0, 22.0, 40.0, 52.0, 80.0, 141.0, 234.0, 119.0, 68.0, 42.0, 38.0, 20.0, 17.0, 18.0, 12.0, 10.0, 8.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.412353515625, -0.40128326416015625, -0.3902130126953125, -0.37914276123046875, -0.368072509765625, -0.35700225830078125, -0.3459320068359375, -0.33486175537109375, -0.32379150390625, -0.31272125244140625, -0.3016510009765625, -0.29058074951171875, -0.279510498046875, -0.26844024658203125, -0.2573699951171875, -0.24629974365234375, -0.2352294921875, -0.22415924072265625, -0.2130889892578125, -0.20201873779296875, -0.190948486328125, -0.17987823486328125, -0.1688079833984375, -0.15773773193359375, -0.14666748046875, -0.13559722900390625, -0.1245269775390625, -0.11345672607421875, -0.102386474609375, -0.09131622314453125, -0.0802459716796875, -0.06917572021484375, -0.05810546875, -0.04703521728515625, -0.0359649658203125, -0.02489471435546875, -0.013824462890625, -0.00275421142578125, 0.0083160400390625, 0.01938629150390625, 0.03045654296875, 0.04152679443359375, 0.0525970458984375, 0.06366729736328125, 0.074737548828125, 0.08580780029296875, 0.0968780517578125, 0.10794830322265625, 0.1190185546875, 0.13008880615234375, 0.1411590576171875, 0.15222930908203125, 0.163299560546875, 0.17436981201171875, 0.1854400634765625, 0.19651031494140625, 0.20758056640625, 0.21865081787109375, 0.2297210693359375, 0.24079132080078125, 0.251861572265625, 0.26293182373046875, 0.2740020751953125, 0.28507232666015625, 0.296142578125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 4.0, 32.0, 100.0, 293.0, 351.0, 159.0, 45.0, 16.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.670278072357178, -6.201328754425049, -5.73237943649292, -5.263430595397949, -4.79448127746582, -4.325531959533691, -3.8565826416015625, -3.3876333236694336, -2.9186840057373047, -2.449734687805176, -1.9807854890823364, -1.511836290359497, -1.0428869724273682, -0.5739376544952393, -0.10498857498168945, 0.36396074295043945, 0.8329100608825684, 1.3018593788146973, 1.7708085775375366, 2.239757776260376, 2.708707094192505, 3.177656412124634, 3.6466054916381836, 4.1155548095703125, 4.584504127502441, 5.05345344543457, 5.522402763366699, 5.991352081298828, 6.460301399230957, 6.929250717163086, 7.398199558258057, 7.8671488761901855, 8.336097717285156, 8.805047035217285, 9.273996353149414, 9.742945671081543, 10.211894989013672, 10.6808443069458, 11.14979362487793, 11.618741989135742, 12.087692260742188, 12.556641578674316, 13.025590896606445, 13.494540214538574, 13.963489532470703, 14.432438850402832, 14.901388168334961, 15.370336532592773, 15.839285850524902, 16.30823516845703, 16.777183532714844, 17.24613380432129, 17.7150821685791, 18.184032440185547, 18.65298080444336, 19.121931076049805, 19.590879440307617, 20.05982780456543, 20.528778076171875, 20.997726440429688, 21.466676712036133, 21.935625076293945, 22.40457534790039, 22.873523712158203, 23.34247398376465]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 2.0, 5.0, 3.0, 11.0, 10.0, 10.0, 24.0, 26.0, 24.0, 33.0, 27.0, 18.0, 45.0, 32.0, 48.0, 41.0, 36.0, 43.0, 48.0, 52.0, 49.0, 47.0, 34.0, 42.0, 27.0, 37.0, 47.0, 29.0, 16.0, 21.0, 22.0, 20.0, 18.0, 9.0, 10.0, 9.0, 5.0, 4.0, 8.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.781528949737549, -4.603460788726807, -4.425393104553223, -4.2473249435424805, -4.069256782531738, -3.8911890983581543, -3.713120937347412, -3.535053014755249, -3.356985092163086, -3.178917169570923, -3.0008490085601807, -2.8227810859680176, -2.6447131633758545, -2.4666452407836914, -2.288577079772949, -2.110509157180786, -1.932440996170044, -1.7543729543685913, -1.5763050317764282, -1.3982369899749756, -1.2201690673828125, -1.0421010255813599, -0.8640329837799072, -0.6859650611877441, -0.5078970193862915, -0.32982903718948364, -0.1517610251903534, 0.026306986808776855, 0.20437496900558472, 0.3824429512023926, 0.5605109930038452, 0.7385789155960083, 0.9166469573974609, 1.0947149991989136, 1.2727829217910767, 1.4508509635925293, 1.6289188861846924, 1.806986927986145, 1.9850549697875977, 2.1631228923797607, 2.341190814971924, 2.519258737564087, 2.697326898574829, 2.875394821166992, 3.0534627437591553, 3.2315306663513184, 3.4095988273620605, 3.5876667499542236, 3.765734910964966, 3.943802833557129, 4.121870994567871, 4.299939155578613, 4.478006839752197, 4.6560750007629395, 4.834142684936523, 5.012210845947266, 5.190279006958008, 5.36834716796875, 5.546414852142334, 5.724483013153076, 5.902551174163818, 6.080618858337402, 6.2586870193481445, 6.436755180358887, 6.614822864532471]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 15.0, 13.0, 23.0, 21.0, 24.0, 31.0, 44.0, 57.0, 84.0, 127.0, 158.0, 253.0, 355.0, 515.0, 951.0, 1815.0, 3513.0, 8597.0, 25557.0, 116232.0, 1669861.0, 2187792.0, 134549.0, 26826.0, 8538.0, 3703.0, 1689.0, 965.0, 585.0, 393.0, 260.0, 180.0, 110.0, 104.0, 86.0, 59.0, 43.0, 38.0, 36.0, 18.0, 15.0, 10.0, 15.0, 9.0, 5.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.046875, -1.973876953125, -1.90087890625, -1.827880859375, -1.7548828125, -1.681884765625, -1.60888671875, -1.535888671875, -1.462890625, -1.389892578125, -1.31689453125, -1.243896484375, -1.1708984375, -1.097900390625, -1.02490234375, -0.951904296875, -0.87890625, -0.805908203125, -0.73291015625, -0.659912109375, -0.5869140625, -0.513916015625, -0.44091796875, -0.367919921875, -0.294921875, -0.221923828125, -0.14892578125, -0.075927734375, -0.0029296875, 0.070068359375, 0.14306640625, 0.216064453125, 0.2890625, 0.362060546875, 0.43505859375, 0.508056640625, 0.5810546875, 0.654052734375, 0.72705078125, 0.800048828125, 0.873046875, 0.946044921875, 1.01904296875, 1.092041015625, 1.1650390625, 1.238037109375, 1.31103515625, 1.384033203125, 1.45703125, 1.530029296875, 1.60302734375, 1.676025390625, 1.7490234375, 1.822021484375, 1.89501953125, 1.968017578125, 2.041015625, 2.114013671875, 2.18701171875, 2.260009765625, 2.3330078125, 2.406005859375, 2.47900390625, 2.552001953125, 2.625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 7.0, 9.0, 12.0, 17.0, 18.0, 45.0, 42.0, 41.0, 64.0, 98.0, 90.0, 100.0, 107.0, 78.0, 75.0, 48.0, 47.0, 24.0, 29.0, 19.0, 11.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.322265625, -1.254669189453125, -1.18707275390625, -1.119476318359375, -1.0518798828125, -0.984283447265625, -0.91668701171875, -0.849090576171875, -0.781494140625, -0.713897705078125, -0.64630126953125, -0.578704833984375, -0.5111083984375, -0.443511962890625, -0.37591552734375, -0.308319091796875, -0.24072265625, -0.173126220703125, -0.10552978515625, -0.037933349609375, 0.0296630859375, 0.097259521484375, 0.16485595703125, 0.232452392578125, 0.300048828125, 0.367645263671875, 0.43524169921875, 0.502838134765625, 0.5704345703125, 0.638031005859375, 0.70562744140625, 0.773223876953125, 0.8408203125, 0.908416748046875, 0.97601318359375, 1.043609619140625, 1.1112060546875, 1.178802490234375, 1.24639892578125, 1.313995361328125, 1.381591796875, 1.449188232421875, 1.51678466796875, 1.584381103515625, 1.6519775390625, 1.719573974609375, 1.78717041015625, 1.854766845703125, 1.92236328125, 1.989959716796875, 2.05755615234375, 2.125152587890625, 2.1927490234375, 2.260345458984375, 2.32794189453125, 2.395538330078125, 2.463134765625, 2.530731201171875, 2.59832763671875, 2.665924072265625, 2.7335205078125, 2.801116943359375, 2.86871337890625, 2.936309814453125, 3.00390625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 7.0, 6.0, 6.0, 7.0, 7.0, 21.0, 27.0, 62.0, 99.0, 143.0, 260.0, 582.0, 1286.0, 4037.0, 21820.0, 454698.0, 3614012.0, 84027.0, 9089.0, 2264.0, 941.0, 397.0, 207.0, 104.0, 64.0, 37.0, 21.0, 12.0, 10.0, 8.0, 3.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.91015625, -4.75311279296875, -4.5960693359375, -4.43902587890625, -4.281982421875, -4.12493896484375, -3.9678955078125, -3.81085205078125, -3.65380859375, -3.49676513671875, -3.3397216796875, -3.18267822265625, -3.025634765625, -2.86859130859375, -2.7115478515625, -2.55450439453125, -2.3974609375, -2.24041748046875, -2.0833740234375, -1.92633056640625, -1.769287109375, -1.61224365234375, -1.4552001953125, -1.29815673828125, -1.14111328125, -0.98406982421875, -0.8270263671875, -0.66998291015625, -0.512939453125, -0.35589599609375, -0.1988525390625, -0.04180908203125, 0.115234375, 0.27227783203125, 0.4293212890625, 0.58636474609375, 0.743408203125, 0.90045166015625, 1.0574951171875, 1.21453857421875, 1.37158203125, 1.52862548828125, 1.6856689453125, 1.84271240234375, 1.999755859375, 2.15679931640625, 2.3138427734375, 2.47088623046875, 2.6279296875, 2.78497314453125, 2.9420166015625, 3.09906005859375, 3.256103515625, 3.41314697265625, 3.5701904296875, 3.72723388671875, 3.88427734375, 4.04132080078125, 4.1983642578125, 4.35540771484375, 4.512451171875, 4.66949462890625, 4.8265380859375, 4.98358154296875, 5.140625]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 7.0, 17.0, 22.0, 31.0, 40.0, 70.0, 102.0, 160.0, 265.0, 541.0, 834.0, 776.0, 441.0, 277.0, 157.0, 117.0, 58.0, 47.0, 27.0, 24.0, 12.0, 10.0, 7.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1103515625, -1.0794525146484375, -1.048553466796875, -1.0176544189453125, -0.98675537109375, -0.9558563232421875, -0.924957275390625, -0.8940582275390625, -0.8631591796875, -0.8322601318359375, -0.801361083984375, -0.7704620361328125, -0.73956298828125, -0.7086639404296875, -0.677764892578125, -0.6468658447265625, -0.615966796875, -0.5850677490234375, -0.554168701171875, -0.5232696533203125, -0.49237060546875, -0.4614715576171875, -0.430572509765625, -0.3996734619140625, -0.3687744140625, -0.3378753662109375, -0.306976318359375, -0.2760772705078125, -0.24517822265625, -0.2142791748046875, -0.183380126953125, -0.1524810791015625, -0.12158203125, -0.0906829833984375, -0.059783935546875, -0.0288848876953125, 0.00201416015625, 0.0329132080078125, 0.063812255859375, 0.0947113037109375, 0.1256103515625, 0.1565093994140625, 0.187408447265625, 0.2183074951171875, 0.24920654296875, 0.2801055908203125, 0.311004638671875, 0.3419036865234375, 0.372802734375, 0.4037017822265625, 0.434600830078125, 0.4654998779296875, 0.49639892578125, 0.5272979736328125, 0.558197021484375, 0.5890960693359375, 0.6199951171875, 0.6508941650390625, 0.681793212890625, 0.7126922607421875, 0.74359130859375, 0.7744903564453125, 0.805389404296875, 0.8362884521484375, 0.8671875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 8.0, 9.0, 13.0, 20.0, 20.0, 25.0, 25.0, 52.0, 52.0, 60.0, 66.0, 80.0, 70.0, 71.0, 86.0, 68.0, 73.0, 49.0, 31.0, 25.0, 29.0, 16.0, 10.0, 7.0, 9.0, 5.0, 6.0, 5.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.405890464782715, -2.3250732421875, -2.244256019592285, -2.1634387969970703, -2.0826215744018555, -2.0018043518066406, -1.9209871292114258, -1.840169906616211, -1.759352684020996, -1.6785354614257812, -1.5977182388305664, -1.5169010162353516, -1.4360837936401367, -1.3552665710449219, -1.274449348449707, -1.1936321258544922, -1.1128149032592773, -1.0319976806640625, -0.9511804580688477, -0.8703632354736328, -0.789546012878418, -0.7087287902832031, -0.6279115676879883, -0.5470943450927734, -0.4662771224975586, -0.38545989990234375, -0.3046426773071289, -0.22382545471191406, -0.14300823211669922, -0.062191009521484375, 0.01862621307373047, 0.09944343566894531, 0.18026089668273926, 0.2610781192779541, 0.34189534187316895, 0.4227125644683838, 0.5035297870635986, 0.5843470096588135, 0.6651642322540283, 0.7459814548492432, 0.826798677444458, 0.9076159000396729, 0.9884331226348877, 1.0692503452301025, 1.1500675678253174, 1.2308847904205322, 1.311702013015747, 1.392519235610962, 1.4733364582061768, 1.5541536808013916, 1.6349709033966064, 1.7157881259918213, 1.7966053485870361, 1.877422571182251, 1.9582397937774658, 2.0390570163726807, 2.1198742389678955, 2.2006914615631104, 2.281508684158325, 2.36232590675354, 2.443143129348755, 2.5239603519439697, 2.6047775745391846, 2.6855947971343994, 2.7664120197296143]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 8.0, 8.0, 8.0, 14.0, 20.0, 34.0, 33.0, 38.0, 56.0, 53.0, 57.0, 69.0, 71.0, 63.0, 56.0, 62.0, 71.0, 50.0, 54.0, 41.0, 40.0, 34.0, 24.0, 12.0, 11.0, 8.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.071363925933838, -1.985168695449829, -1.8989734649658203, -1.8127782344818115, -1.7265828847885132, -1.6403876543045044, -1.5541924238204956, -1.4679970741271973, -1.3818018436431885, -1.2956066131591797, -1.209411382675171, -1.123216152191162, -1.0370208024978638, -0.950825572013855, -0.8646303415298462, -0.7784350514411926, -0.6922398805618286, -0.6060446500778198, -0.5198493599891663, -0.43365412950515747, -0.3474588692188263, -0.2612636089324951, -0.17506837844848633, -0.08887308835983276, -0.0026778578758239746, 0.0835173949599266, 0.16971264779567719, 0.25590789318084717, 0.34210315346717834, 0.4282984137535095, 0.5144936442375183, 0.6006889343261719, 0.6868841648101807, 0.7730793952941895, 0.859274685382843, 0.9454699158668518, 1.0316652059555054, 1.1178604364395142, 1.204055666923523, 1.2902510166168213, 1.37644624710083, 1.4626414775848389, 1.5488367080688477, 1.6350319385528564, 1.7212272882461548, 1.8074225187301636, 1.8936177492141724, 1.9798130989074707, 2.0660080909729004, 2.152203321456909, 2.238398551940918, 2.3245937824249268, 2.4107890129089355, 2.4969844818115234, 2.583179473876953, 2.669374942779541, 2.75557017326355, 2.8417654037475586, 2.9279606342315674, 3.014155864715576, 3.100351095199585, 3.1865463256835938, 3.2727417945861816, 3.3589370250701904, 3.445132255554199]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 7.0, 8.0, 18.0, 29.0, 36.0, 54.0, 97.0, 183.0, 354.0, 885.0, 2959.0, 18904.0, 565457.0, 438939.0, 16394.0, 2645.0, 800.0, 354.0, 163.0, 102.0, 58.0, 35.0, 20.0, 17.0, 15.0, 5.0, 5.0, 5.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.355224609375, -0.3390541076660156, -0.32288360595703125, -0.3067131042480469, -0.2905426025390625, -0.2743721008300781, -0.25820159912109375, -0.24203109741210938, -0.225860595703125, -0.20969009399414062, -0.19351959228515625, -0.17734909057617188, -0.1611785888671875, -0.14500808715820312, -0.12883758544921875, -0.11266708374023438, -0.09649658203125, -0.08032608032226562, -0.06415557861328125, -0.047985076904296875, -0.0318145751953125, -0.015644073486328125, 0.00052642822265625, 0.016696929931640625, 0.032867431640625, 0.049037933349609375, 0.06520843505859375, 0.08137893676757812, 0.0975494384765625, 0.11371994018554688, 0.12989044189453125, 0.14606094360351562, 0.1622314453125, 0.17840194702148438, 0.19457244873046875, 0.21074295043945312, 0.2269134521484375, 0.24308395385742188, 0.25925445556640625, 0.2754249572753906, 0.291595458984375, 0.3077659606933594, 0.32393646240234375, 0.3401069641113281, 0.3562774658203125, 0.3724479675292969, 0.38861846923828125, 0.4047889709472656, 0.42095947265625, 0.4371299743652344, 0.45330047607421875, 0.4694709777832031, 0.4856414794921875, 0.5018119812011719, 0.5179824829101562, 0.5341529846191406, 0.550323486328125, 0.5664939880371094, 0.5826644897460938, 0.5988349914550781, 0.6150054931640625, 0.6311759948730469, 0.6473464965820312, 0.6635169982910156, 0.6796875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 4.0, 12.0, 9.0, 23.0, 26.0, 29.0, 52.0, 50.0, 57.0, 68.0, 70.0, 85.0, 69.0, 81.0, 66.0, 65.0, 59.0, 50.0, 39.0, 31.0, 15.0, 14.0, 11.0, 5.0, 6.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.3081207275390625, -1.246124267578125, -1.1841278076171875, -1.12213134765625, -1.0601348876953125, -0.998138427734375, -0.9361419677734375, -0.8741455078125, -0.8121490478515625, -0.750152587890625, -0.6881561279296875, -0.62615966796875, -0.5641632080078125, -0.502166748046875, -0.4401702880859375, -0.378173828125, -0.3161773681640625, -0.254180908203125, -0.1921844482421875, -0.13018798828125, -0.0681915283203125, -0.006195068359375, 0.0558013916015625, 0.1177978515625, 0.1797943115234375, 0.241790771484375, 0.3037872314453125, 0.36578369140625, 0.4277801513671875, 0.489776611328125, 0.5517730712890625, 0.61376953125, 0.6757659912109375, 0.737762451171875, 0.7997589111328125, 0.86175537109375, 0.9237518310546875, 0.985748291015625, 1.0477447509765625, 1.1097412109375, 1.1717376708984375, 1.233734130859375, 1.2957305908203125, 1.35772705078125, 1.4197235107421875, 1.481719970703125, 1.5437164306640625, 1.605712890625, 1.6677093505859375, 1.729705810546875, 1.7917022705078125, 1.85369873046875, 1.9156951904296875, 1.977691650390625, 2.0396881103515625, 2.1016845703125, 2.1636810302734375, 2.225677490234375, 2.2876739501953125, 2.34967041015625, 2.4116668701171875, 2.473663330078125, 2.5356597900390625, 2.59765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 2.0, 3.0, 8.0, 9.0, 11.0, 10.0, 16.0, 12.0, 23.0, 21.0, 32.0, 58.0, 46.0, 88.0, 124.0, 166.0, 282.0, 430.0, 994.0, 4642.0, 48591.0, 796180.0, 182880.0, 10697.0, 1533.0, 576.0, 309.0, 206.0, 138.0, 123.0, 83.0, 73.0, 47.0, 38.0, 17.0, 24.0, 24.0, 15.0, 4.0, 5.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.258056640625, -0.24874114990234375, -0.2394256591796875, -0.23011016845703125, -0.220794677734375, -0.21147918701171875, -0.2021636962890625, -0.19284820556640625, -0.18353271484375, -0.17421722412109375, -0.1649017333984375, -0.15558624267578125, -0.146270751953125, -0.13695526123046875, -0.1276397705078125, -0.11832427978515625, -0.1090087890625, -0.09969329833984375, -0.0903778076171875, -0.08106231689453125, -0.071746826171875, -0.06243133544921875, -0.0531158447265625, -0.04380035400390625, -0.03448486328125, -0.02516937255859375, -0.0158538818359375, -0.00653839111328125, 0.002777099609375, 0.01209259033203125, 0.0214080810546875, 0.03072357177734375, 0.0400390625, 0.04935455322265625, 0.0586700439453125, 0.06798553466796875, 0.077301025390625, 0.08661651611328125, 0.0959320068359375, 0.10524749755859375, 0.11456298828125, 0.12387847900390625, 0.1331939697265625, 0.14250946044921875, 0.151824951171875, 0.16114044189453125, 0.1704559326171875, 0.17977142333984375, 0.1890869140625, 0.19840240478515625, 0.2077178955078125, 0.21703338623046875, 0.226348876953125, 0.23566436767578125, 0.2449798583984375, 0.25429534912109375, 0.26361083984375, 0.27292633056640625, 0.2822418212890625, 0.29155731201171875, 0.300872802734375, 0.31018829345703125, 0.3195037841796875, 0.32881927490234375, 0.338134765625]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 6.0, 6.0, 13.0, 6.0, 6.0, 14.0, 5.0, 13.0, 18.0, 17.0, 32.0, 26.0, 37.0, 35.0, 40.0, 56.0, 60.0, 42.0, 50.0, 43.0, 55.0, 66.0, 53.0, 41.0, 35.0, 33.0, 33.0, 33.0, 21.0, 21.0, 24.0, 10.0, 10.0, 10.0, 8.0, 6.0, 7.0, 5.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.341094970703125, -2.25054931640625, -2.160003662109375, -2.0694580078125, -1.978912353515625, -1.88836669921875, -1.797821044921875, -1.707275390625, -1.616729736328125, -1.52618408203125, -1.435638427734375, -1.3450927734375, -1.254547119140625, -1.16400146484375, -1.073455810546875, -0.98291015625, -0.892364501953125, -0.80181884765625, -0.711273193359375, -0.6207275390625, -0.530181884765625, -0.43963623046875, -0.349090576171875, -0.258544921875, -0.167999267578125, -0.07745361328125, 0.013092041015625, 0.1036376953125, 0.194183349609375, 0.28472900390625, 0.375274658203125, 0.4658203125, 0.556365966796875, 0.64691162109375, 0.737457275390625, 0.8280029296875, 0.918548583984375, 1.00909423828125, 1.099639892578125, 1.190185546875, 1.280731201171875, 1.37127685546875, 1.461822509765625, 1.5523681640625, 1.642913818359375, 1.73345947265625, 1.824005126953125, 1.91455078125, 2.005096435546875, 2.09564208984375, 2.186187744140625, 2.2767333984375, 2.367279052734375, 2.45782470703125, 2.548370361328125, 2.638916015625, 2.729461669921875, 2.82000732421875, 2.910552978515625, 3.0010986328125, 3.091644287109375, 3.18218994140625, 3.272735595703125, 3.36328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 4.0, 8.0, 9.0, 9.0, 12.0, 20.0, 24.0, 39.0, 57.0, 97.0, 192.0, 394.0, 981.0, 13344.0, 1023689.0, 8018.0, 880.0, 306.0, 157.0, 104.0, 77.0, 54.0, 26.0, 20.0, 8.0, 9.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1646728515625, -0.16002655029296875, -0.1553802490234375, -0.15073394775390625, -0.146087646484375, -0.14144134521484375, -0.1367950439453125, -0.13214874267578125, -0.12750244140625, -0.12285614013671875, -0.1182098388671875, -0.11356353759765625, -0.108917236328125, -0.10427093505859375, -0.0996246337890625, -0.09497833251953125, -0.09033203125, -0.08568572998046875, -0.0810394287109375, -0.07639312744140625, -0.071746826171875, -0.06710052490234375, -0.0624542236328125, -0.05780792236328125, -0.05316162109375, -0.04851531982421875, -0.0438690185546875, -0.03922271728515625, -0.034576416015625, -0.02993011474609375, -0.0252838134765625, -0.02063751220703125, -0.0159912109375, -0.01134490966796875, -0.0066986083984375, -0.00205230712890625, 0.002593994140625, 0.00724029541015625, 0.0118865966796875, 0.01653289794921875, 0.02117919921875, 0.02582550048828125, 0.0304718017578125, 0.03511810302734375, 0.039764404296875, 0.04441070556640625, 0.0490570068359375, 0.05370330810546875, 0.058349609375, 0.06299591064453125, 0.0676422119140625, 0.07228851318359375, 0.076934814453125, 0.08158111572265625, 0.0862274169921875, 0.09087371826171875, 0.09552001953125, 0.10016632080078125, 0.1048126220703125, 0.10945892333984375, 0.114105224609375, 0.11875152587890625, 0.1233978271484375, 0.12804412841796875, 0.1326904296875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 2.0, 15.0, 21.0, 20.0, 44.0, 76.0, 169.0, 221.0, 165.0, 114.0, 49.0, 34.0, 17.0, 19.0, 14.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.930662155151367e-05, -5.791615694761276e-05, -5.652569234371185e-05, -5.5135227739810944e-05, -5.3744763135910034e-05, -5.2354298532009125e-05, -5.0963833928108215e-05, -4.9573369324207306e-05, -4.8182904720306396e-05, -4.679244011640549e-05, -4.540197551250458e-05, -4.401151090860367e-05, -4.262104630470276e-05, -4.123058170080185e-05, -3.984011709690094e-05, -3.844965249300003e-05, -3.705918788909912e-05, -3.566872328519821e-05, -3.42782586812973e-05, -3.288779407739639e-05, -3.1497329473495483e-05, -3.0106864869594574e-05, -2.8716400265693665e-05, -2.7325935661792755e-05, -2.5935471057891846e-05, -2.4545006453990936e-05, -2.3154541850090027e-05, -2.1764077246189117e-05, -2.0373612642288208e-05, -1.89831480383873e-05, -1.759268343448639e-05, -1.620221883058548e-05, -1.481175422668457e-05, -1.3421289622783661e-05, -1.2030825018882751e-05, -1.0640360414981842e-05, -9.249895811080933e-06, -7.859431207180023e-06, -6.468966603279114e-06, -5.078501999378204e-06, -3.688037395477295e-06, -2.2975727915763855e-06, -9.071081876754761e-07, 4.833564162254333e-07, 1.8738210201263428e-06, 3.264285624027252e-06, 4.654750227928162e-06, 6.045214831829071e-06, 7.4356794357299805e-06, 8.82614403963089e-06, 1.02166086435318e-05, 1.1607073247432709e-05, 1.2997537851333618e-05, 1.4388002455234528e-05, 1.5778467059135437e-05, 1.7168931663036346e-05, 1.8559396266937256e-05, 1.9949860870838165e-05, 2.1340325474739075e-05, 2.2730790078639984e-05, 2.4121254682540894e-05, 2.5511719286441803e-05, 2.6902183890342712e-05, 2.8292648494243622e-05, 2.968311309814453e-05]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 11.0, 10.0, 22.0, 29.0, 59.0, 73.0, 149.0, 246.0, 413.0, 807.0, 1691.0, 4619.0, 18023.0, 275116.0, 713034.0, 24600.0, 5710.0, 1947.0, 874.0, 485.0, 259.0, 138.0, 95.0, 52.0, 33.0, 24.0, 18.0, 5.0, 5.0, 5.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1229248046875, -0.11951828002929688, -0.11611175537109375, -0.11270523071289062, -0.1092987060546875, -0.10589218139648438, -0.10248565673828125, -0.09907913208007812, -0.095672607421875, -0.09226608276367188, -0.08885955810546875, -0.08545303344726562, -0.0820465087890625, -0.07863998413085938, -0.07523345947265625, -0.07182693481445312, -0.06842041015625, -0.06501388549804688, -0.06160736083984375, -0.058200836181640625, -0.0547943115234375, -0.051387786865234375, -0.04798126220703125, -0.044574737548828125, -0.041168212890625, -0.037761688232421875, -0.03435516357421875, -0.030948638916015625, -0.0275421142578125, -0.024135589599609375, -0.02072906494140625, -0.017322540283203125, -0.013916015625, -0.010509490966796875, -0.00710296630859375, -0.003696441650390625, -0.0002899169921875, 0.003116607666015625, 0.00652313232421875, 0.009929656982421875, 0.013336181640625, 0.016742706298828125, 0.02014923095703125, 0.023555755615234375, 0.0269622802734375, 0.030368804931640625, 0.03377532958984375, 0.037181854248046875, 0.04058837890625, 0.043994903564453125, 0.04740142822265625, 0.050807952880859375, 0.0542144775390625, 0.057621002197265625, 0.06102752685546875, 0.06443405151367188, 0.067840576171875, 0.07124710083007812, 0.07465362548828125, 0.07806015014648438, 0.0814666748046875, 0.08487319946289062, 0.08827972412109375, 0.09168624877929688, 0.0950927734375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 9.0, 2.0, 7.0, 3.0, 9.0, 11.0, 16.0, 21.0, 51.0, 96.0, 313.0, 258.0, 96.0, 41.0, 24.0, 18.0, 5.0, 6.0, 9.0, 4.0, 7.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03143310546875, -0.030305862426757812, -0.029178619384765625, -0.028051376342773438, -0.02692413330078125, -0.025796890258789062, -0.024669647216796875, -0.023542404174804688, -0.0224151611328125, -0.021287918090820312, -0.020160675048828125, -0.019033432006835938, -0.01790618896484375, -0.016778945922851562, -0.015651702880859375, -0.014524459838867188, -0.013397216796875, -0.012269973754882812, -0.011142730712890625, -0.010015487670898438, -0.00888824462890625, -0.0077610015869140625, -0.006633758544921875, -0.0055065155029296875, -0.0043792724609375, -0.0032520294189453125, -0.002124786376953125, -0.0009975433349609375, 0.00012969970703125, 0.0012569427490234375, 0.002384185791015625, 0.0035114288330078125, 0.004638671875, 0.0057659149169921875, 0.006893157958984375, 0.008020401000976562, 0.00914764404296875, 0.010274887084960938, 0.011402130126953125, 0.012529373168945312, 0.0136566162109375, 0.014783859252929688, 0.015911102294921875, 0.017038345336914062, 0.01816558837890625, 0.019292831420898438, 0.020420074462890625, 0.021547317504882812, 0.022674560546875, 0.023801803588867188, 0.024929046630859375, 0.026056289672851562, 0.02718353271484375, 0.028310775756835938, 0.029438018798828125, 0.030565261840820312, 0.0316925048828125, 0.03281974792480469, 0.033946990966796875, 0.03507423400878906, 0.03620147705078125, 0.03732872009277344, 0.038455963134765625, 0.03958320617675781, 0.04071044921875]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 4.0, 11.0, 15.0, 22.0, 29.0, 36.0, 72.0, 80.0, 76.0, 126.0, 94.0, 112.0, 96.0, 78.0, 50.0, 22.0, 29.0, 17.0, 8.0, 3.0, 8.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5251941680908203, -2.455779790878296, -2.3863654136657715, -2.316951274871826, -2.2475368976593018, -2.1781225204467773, -2.108708143234253, -2.0392937660217285, -1.9698795080184937, -1.9004651308059692, -1.8310508728027344, -1.76163649559021, -1.6922221183776855, -1.6228078603744507, -1.5533934831619263, -1.4839792251586914, -1.414564847946167, -1.3451504707336426, -1.2757362127304077, -1.2063218355178833, -1.1369075775146484, -1.067493200302124, -0.9980788230895996, -0.92866450548172, -0.8592501878738403, -0.7898358702659607, -0.720421552658081, -0.6510071754455566, -0.581592857837677, -0.5121785402297974, -0.44276419281959534, -0.3733498454093933, -0.3039356470108032, -0.2345213145017624, -0.16510698199272156, -0.09569264948368073, -0.026278316974639893, 0.043136000633239746, 0.11255034804344177, 0.1819646954536438, 0.25137901306152344, 0.3207933306694031, 0.3902076780796051, 0.45962202548980713, 0.5290363430976868, 0.5984506607055664, 0.6678650379180908, 0.7372793555259705, 0.8066936731338501, 0.8761079907417297, 0.9455223083496094, 1.0149366855621338, 1.0843510627746582, 1.153765320777893, 1.2231796979904175, 1.2925939559936523, 1.3620083332061768, 1.4314227104187012, 1.500836968421936, 1.5702513456344604, 1.6396656036376953, 1.7090799808502197, 1.7784943580627441, 1.8479087352752686, 1.9173229932785034]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 12.0, 6.0, 26.0, 25.0, 33.0, 47.0, 52.0, 64.0, 74.0, 69.0, 76.0, 69.0, 75.0, 75.0, 59.0, 59.0, 47.0, 40.0, 30.0, 20.0, 13.0, 9.0, 4.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3186020851135254, -1.2591097354888916, -1.1996172666549683, -1.1401249170303345, -1.0806325674057007, -1.0211400985717773, -0.9616477489471436, -0.9021553993225098, -0.8426629900932312, -0.7831705808639526, -0.7236782312393188, -0.6641858220100403, -0.6046934127807617, -0.5452010631561279, -0.48570865392684937, -0.4262162744998932, -0.366723895072937, -0.30723151564598083, -0.24773912131786346, -0.1882467269897461, -0.12875434756278992, -0.06926196813583374, -0.009769558906555176, 0.049722820520401, 0.10921519994735718, 0.16870757937431335, 0.22819997370243073, 0.2876923680305481, 0.3471847474575043, 0.40667712688446045, 0.466169536113739, 0.5256619453430176, 0.5851542949676514, 0.6446467041969299, 0.7041390538215637, 0.7636314630508423, 0.8231238126754761, 0.8826162219047546, 0.9421086311340332, 1.001600980758667, 1.0610933303833008, 1.1205856800079346, 1.180078148841858, 1.2395704984664917, 1.2990628480911255, 1.3585553169250488, 1.4180476665496826, 1.4775400161743164, 1.5370324850082397, 1.5965248346328735, 1.6560173034667969, 1.7155096530914307, 1.7750020027160645, 1.8344943523406982, 1.8939868211746216, 1.9534791707992554, 2.0129716396331787, 2.0724639892578125, 2.1319563388824463, 2.19144868850708, 2.250941276550293, 2.3104336261749268, 2.3699259757995605, 2.4294183254241943, 2.488910675048828]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 8.0, 12.0, 23.0, 27.0, 35.0, 42.0, 77.0, 106.0, 136.0, 215.0, 317.0, 439.0, 666.0, 1109.0, 1686.0, 2792.0, 4821.0, 8745.0, 16475.0, 35723.0, 92560.0, 386242.0, 342871.0, 84285.0, 33156.0, 15657.0, 8216.0, 4579.0, 2707.0, 1689.0, 1068.0, 691.0, 413.0, 302.0, 191.0, 131.0, 91.0, 81.0, 57.0, 26.0, 23.0, 16.0, 15.0, 5.0, 3.0, 3.0, 4.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.6640625, -1.6135711669921875, -1.563079833984375, -1.5125885009765625, -1.46209716796875, -1.4116058349609375, -1.361114501953125, -1.3106231689453125, -1.2601318359375, -1.2096405029296875, -1.159149169921875, -1.1086578369140625, -1.05816650390625, -1.0076751708984375, -0.957183837890625, -0.9066925048828125, -0.856201171875, -0.8057098388671875, -0.755218505859375, -0.7047271728515625, -0.65423583984375, -0.6037445068359375, -0.553253173828125, -0.5027618408203125, -0.4522705078125, -0.4017791748046875, -0.351287841796875, -0.3007965087890625, -0.25030517578125, -0.1998138427734375, -0.149322509765625, -0.0988311767578125, -0.04833984375, 0.0021514892578125, 0.052642822265625, 0.1031341552734375, 0.15362548828125, 0.2041168212890625, 0.254608154296875, 0.3050994873046875, 0.3555908203125, 0.4060821533203125, 0.456573486328125, 0.5070648193359375, 0.55755615234375, 0.6080474853515625, 0.658538818359375, 0.7090301513671875, 0.759521484375, 0.8100128173828125, 0.860504150390625, 0.9109954833984375, 0.96148681640625, 1.0119781494140625, 1.062469482421875, 1.1129608154296875, 1.1634521484375, 1.2139434814453125, 1.264434814453125, 1.3149261474609375, 1.36541748046875, 1.4159088134765625, 1.466400146484375, 1.5168914794921875, 1.5673828125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 7.0, 5.0, 7.0, 16.0, 14.0, 36.0, 32.0, 41.0, 60.0, 61.0, 65.0, 71.0, 74.0, 65.0, 83.0, 56.0, 70.0, 44.0, 47.0, 41.0, 27.0, 23.0, 18.0, 8.0, 9.0, 7.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.298828125, -3.185882568359375, -3.07293701171875, -2.959991455078125, -2.8470458984375, -2.734100341796875, -2.62115478515625, -2.508209228515625, -2.395263671875, -2.282318115234375, -2.16937255859375, -2.056427001953125, -1.9434814453125, -1.830535888671875, -1.71759033203125, -1.604644775390625, -1.49169921875, -1.378753662109375, -1.26580810546875, -1.152862548828125, -1.0399169921875, -0.926971435546875, -0.81402587890625, -0.701080322265625, -0.588134765625, -0.475189208984375, -0.36224365234375, -0.249298095703125, -0.1363525390625, -0.023406982421875, 0.08953857421875, 0.202484130859375, 0.3154296875, 0.428375244140625, 0.54132080078125, 0.654266357421875, 0.7672119140625, 0.880157470703125, 0.99310302734375, 1.106048583984375, 1.218994140625, 1.331939697265625, 1.44488525390625, 1.557830810546875, 1.6707763671875, 1.783721923828125, 1.89666748046875, 2.009613037109375, 2.12255859375, 2.235504150390625, 2.34844970703125, 2.461395263671875, 2.5743408203125, 2.687286376953125, 2.80023193359375, 2.913177490234375, 3.026123046875, 3.139068603515625, 3.25201416015625, 3.364959716796875, 3.4779052734375, 3.590850830078125, 3.70379638671875, 3.816741943359375, 3.9296875]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 9.0, 10.0, 20.0, 19.0, 51.0, 62.0, 104.0, 218.0, 381.0, 805.0, 2014.0, 5645.0, 21378.0, 112933.0, 762737.0, 111559.0, 21301.0, 5680.0, 1947.0, 821.0, 371.0, 202.0, 118.0, 72.0, 38.0, 22.0, 11.0, 10.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0], "bins": [-4.62109375, -4.517242431640625, -4.41339111328125, -4.309539794921875, -4.2056884765625, -4.101837158203125, -3.99798583984375, -3.894134521484375, -3.790283203125, -3.686431884765625, -3.58258056640625, -3.478729248046875, -3.3748779296875, -3.271026611328125, -3.16717529296875, -3.063323974609375, -2.95947265625, -2.855621337890625, -2.75177001953125, -2.647918701171875, -2.5440673828125, -2.440216064453125, -2.33636474609375, -2.232513427734375, -2.128662109375, -2.024810791015625, -1.92095947265625, -1.817108154296875, -1.7132568359375, -1.609405517578125, -1.50555419921875, -1.401702880859375, -1.2978515625, -1.194000244140625, -1.09014892578125, -0.986297607421875, -0.8824462890625, -0.778594970703125, -0.67474365234375, -0.570892333984375, -0.467041015625, -0.363189697265625, -0.25933837890625, -0.155487060546875, -0.0516357421875, 0.052215576171875, 0.15606689453125, 0.259918212890625, 0.36376953125, 0.467620849609375, 0.57147216796875, 0.675323486328125, 0.7791748046875, 0.883026123046875, 0.98687744140625, 1.090728759765625, 1.194580078125, 1.298431396484375, 1.40228271484375, 1.506134033203125, 1.6099853515625, 1.713836669921875, 1.81768798828125, 1.921539306640625, 2.025390625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 0.0, 8.0, 7.0, 3.0, 8.0, 9.0, 9.0, 11.0, 20.0, 25.0, 34.0, 36.0, 35.0, 47.0, 40.0, 55.0, 49.0, 66.0, 56.0, 55.0, 59.0, 54.0, 59.0, 45.0, 40.0, 27.0, 28.0, 32.0, 19.0, 18.0, 16.0, 6.0, 6.0, 5.0, 3.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.34765625, -4.21820068359375, -4.0887451171875, -3.95928955078125, -3.829833984375, -3.70037841796875, -3.5709228515625, -3.44146728515625, -3.31201171875, -3.18255615234375, -3.0531005859375, -2.92364501953125, -2.794189453125, -2.66473388671875, -2.5352783203125, -2.40582275390625, -2.2763671875, -2.14691162109375, -2.0174560546875, -1.88800048828125, -1.758544921875, -1.62908935546875, -1.4996337890625, -1.37017822265625, -1.24072265625, -1.11126708984375, -0.9818115234375, -0.85235595703125, -0.722900390625, -0.59344482421875, -0.4639892578125, -0.33453369140625, -0.205078125, -0.07562255859375, 0.0538330078125, 0.18328857421875, 0.312744140625, 0.44219970703125, 0.5716552734375, 0.70111083984375, 0.83056640625, 0.96002197265625, 1.0894775390625, 1.21893310546875, 1.348388671875, 1.47784423828125, 1.6072998046875, 1.73675537109375, 1.8662109375, 1.99566650390625, 2.1251220703125, 2.25457763671875, 2.384033203125, 2.51348876953125, 2.6429443359375, 2.77239990234375, 2.90185546875, 3.03131103515625, 3.1607666015625, 3.29022216796875, 3.419677734375, 3.54913330078125, 3.6785888671875, 3.80804443359375, 3.9375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 2.0, 11.0, 5.0, 11.0, 25.0, 24.0, 39.0, 63.0, 95.0, 137.0, 241.0, 471.0, 1007.0, 2280.0, 5677.0, 18008.0, 69757.0, 357520.0, 471756.0, 87746.0, 21825.0, 6731.0, 2611.0, 1174.0, 574.0, 278.0, 151.0, 112.0, 62.0, 43.0, 27.0, 21.0, 11.0, 13.0, 10.0, 12.0, 3.0, 7.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.71337890625, -0.69244384765625, -0.6715087890625, -0.65057373046875, -0.629638671875, -0.60870361328125, -0.5877685546875, -0.56683349609375, -0.5458984375, -0.52496337890625, -0.5040283203125, -0.48309326171875, -0.462158203125, -0.44122314453125, -0.4202880859375, -0.39935302734375, -0.37841796875, -0.35748291015625, -0.3365478515625, -0.31561279296875, -0.294677734375, -0.27374267578125, -0.2528076171875, -0.23187255859375, -0.2109375, -0.19000244140625, -0.1690673828125, -0.14813232421875, -0.127197265625, -0.10626220703125, -0.0853271484375, -0.06439208984375, -0.04345703125, -0.02252197265625, -0.0015869140625, 0.01934814453125, 0.040283203125, 0.06121826171875, 0.0821533203125, 0.10308837890625, 0.1240234375, 0.14495849609375, 0.1658935546875, 0.18682861328125, 0.207763671875, 0.22869873046875, 0.2496337890625, 0.27056884765625, 0.29150390625, 0.31243896484375, 0.3333740234375, 0.35430908203125, 0.375244140625, 0.39617919921875, 0.4171142578125, 0.43804931640625, 0.458984375, 0.47991943359375, 0.5008544921875, 0.52178955078125, 0.542724609375, 0.56365966796875, 0.5845947265625, 0.60552978515625, 0.62646484375]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 3.0, 1.0, 5.0, 7.0, 10.0, 8.0, 12.0, 12.0, 18.0, 32.0, 36.0, 48.0, 42.0, 83.0, 118.0, 127.0, 98.0, 84.0, 56.0, 56.0, 30.0, 29.0, 15.0, 12.0, 11.0, 14.0, 14.0, 7.0, 4.0, 2.0, 1.0, 0.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010097026824951172, -9.754952043294907e-05, -9.412877261638641e-05, -9.070802479982376e-05, -8.728727698326111e-05, -8.386652916669846e-05, -8.04457813501358e-05, -7.702503353357315e-05, -7.36042857170105e-05, -7.018353790044785e-05, -6.676279008388519e-05, -6.334204226732254e-05, -5.992129445075989e-05, -5.6500546634197235e-05, -5.307979881763458e-05, -4.965905100107193e-05, -4.623830318450928e-05, -4.2817555367946625e-05, -3.939680755138397e-05, -3.597605973482132e-05, -3.255531191825867e-05, -2.9134564101696014e-05, -2.5713816285133362e-05, -2.229306846857071e-05, -1.8872320652008057e-05, -1.5451572835445404e-05, -1.2030825018882751e-05, -8.610077202320099e-06, -5.189329385757446e-06, -1.7685815691947937e-06, 1.6521662473678589e-06, 5.0729140639305115e-06, 8.493661880493164e-06, 1.1914409697055817e-05, 1.533515751361847e-05, 1.8755905330181122e-05, 2.2176653146743774e-05, 2.5597400963306427e-05, 2.901814877986908e-05, 3.243889659643173e-05, 3.5859644412994385e-05, 3.928039222955704e-05, 4.270114004611969e-05, 4.612188786268234e-05, 4.9542635679244995e-05, 5.296338349580765e-05, 5.63841313123703e-05, 5.980487912893295e-05, 6.32256269454956e-05, 6.664637476205826e-05, 7.006712257862091e-05, 7.348787039518356e-05, 7.690861821174622e-05, 8.032936602830887e-05, 8.375011384487152e-05, 8.717086166143417e-05, 9.059160947799683e-05, 9.401235729455948e-05, 9.743310511112213e-05, 0.00010085385292768478, 0.00010427460074424744, 0.00010769534856081009, 0.00011111609637737274, 0.0001145368441939354, 0.00011795759201049805]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 4.0, 4.0, 9.0, 10.0, 12.0, 13.0, 12.0, 24.0, 38.0, 71.0, 143.0, 278.0, 608.0, 1494.0, 4389.0, 15382.0, 70665.0, 458457.0, 411332.0, 64713.0, 14231.0, 4074.0, 1425.0, 564.0, 267.0, 125.0, 72.0, 52.0, 20.0, 15.0, 16.0, 5.0, 12.0, 9.0, 2.0, 3.0, 3.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85791015625, -0.8326568603515625, -0.807403564453125, -0.7821502685546875, -0.75689697265625, -0.7316436767578125, -0.706390380859375, -0.6811370849609375, -0.6558837890625, -0.6306304931640625, -0.605377197265625, -0.5801239013671875, -0.55487060546875, -0.5296173095703125, -0.504364013671875, -0.4791107177734375, -0.453857421875, -0.4286041259765625, -0.403350830078125, -0.3780975341796875, -0.35284423828125, -0.3275909423828125, -0.302337646484375, -0.2770843505859375, -0.2518310546875, -0.2265777587890625, -0.201324462890625, -0.1760711669921875, -0.15081787109375, -0.1255645751953125, -0.100311279296875, -0.0750579833984375, -0.0498046875, -0.0245513916015625, 0.000701904296875, 0.0259552001953125, 0.05120849609375, 0.0764617919921875, 0.101715087890625, 0.1269683837890625, 0.1522216796875, 0.1774749755859375, 0.202728271484375, 0.2279815673828125, 0.25323486328125, 0.2784881591796875, 0.303741455078125, 0.3289947509765625, 0.354248046875, 0.3795013427734375, 0.404754638671875, 0.4300079345703125, 0.45526123046875, 0.4805145263671875, 0.505767822265625, 0.5310211181640625, 0.5562744140625, 0.5815277099609375, 0.606781005859375, 0.6320343017578125, 0.65728759765625, 0.6825408935546875, 0.707794189453125, 0.7330474853515625, 0.75830078125]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 3.0, 4.0, 8.0, 4.0, 8.0, 14.0, 12.0, 18.0, 16.0, 22.0, 28.0, 32.0, 35.0, 49.0, 73.0, 77.0, 122.0, 83.0, 90.0, 54.0, 56.0, 38.0, 25.0, 26.0, 18.0, 13.0, 12.0, 21.0, 9.0, 2.0, 6.0, 4.0, 2.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.37451171875, -0.364105224609375, -0.35369873046875, -0.343292236328125, -0.3328857421875, -0.322479248046875, -0.31207275390625, -0.301666259765625, -0.291259765625, -0.280853271484375, -0.27044677734375, -0.260040283203125, -0.2496337890625, -0.239227294921875, -0.22882080078125, -0.218414306640625, -0.2080078125, -0.197601318359375, -0.18719482421875, -0.176788330078125, -0.1663818359375, -0.155975341796875, -0.14556884765625, -0.135162353515625, -0.124755859375, -0.114349365234375, -0.10394287109375, -0.093536376953125, -0.0831298828125, -0.072723388671875, -0.06231689453125, -0.051910400390625, -0.04150390625, -0.031097412109375, -0.02069091796875, -0.010284423828125, 0.0001220703125, 0.010528564453125, 0.02093505859375, 0.031341552734375, 0.041748046875, 0.052154541015625, 0.06256103515625, 0.072967529296875, 0.0833740234375, 0.093780517578125, 0.10418701171875, 0.114593505859375, 0.125, 0.135406494140625, 0.14581298828125, 0.156219482421875, 0.1666259765625, 0.177032470703125, 0.18743896484375, 0.197845458984375, 0.208251953125, 0.218658447265625, 0.22906494140625, 0.239471435546875, 0.2498779296875, 0.260284423828125, 0.27069091796875, 0.281097412109375, 0.29150390625]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 5.0, 41.0, 407.0, 490.0, 67.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0273895263671875, -3.052302837371826, -2.077216148376465, -1.1021292209625244, -0.12704253196716309, 0.8480443954467773, 1.8231310844421387, 2.7982177734375, 3.7733044624328613, 4.748391151428223, 5.723477840423584, 6.698564529418945, 7.673651695251465, 8.648738861083984, 9.623825073242188, 10.59891128540039, 11.57399845123291, 12.54908561706543, 13.524171829223633, 14.499258995056152, 15.474345207214355, 16.449432373046875, 17.424518585205078, 18.39960479736328, 19.374692916870117, 20.34977912902832, 21.324867248535156, 22.29995346069336, 23.275039672851562, 24.250125885009766, 25.2252140045166, 26.200300216674805, 27.175386428833008, 28.15047264099121, 29.125560760498047, 30.10064697265625, 31.075733184814453, 32.050819396972656, 33.02590560913086, 34.00099182128906, 34.97608184814453, 35.951168060302734, 36.92625427246094, 37.90134048461914, 38.87643051147461, 39.85151672363281, 40.826602935791016, 41.80168914794922, 42.77677536010742, 43.751861572265625, 44.72694778442383, 45.70203399658203, 46.6771240234375, 47.6522102355957, 48.627296447753906, 49.60238265991211, 50.57746887207031, 51.552555084228516, 52.52764129638672, 53.50272750854492, 54.47781753540039, 55.452903747558594, 56.4279899597168, 57.403076171875, 58.3781623840332]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 7.0, 3.0, 3.0, 4.0, 4.0, 3.0, 5.0, 12.0, 8.0, 9.0, 24.0, 17.0, 25.0, 21.0, 27.0, 24.0, 43.0, 24.0, 27.0, 35.0, 34.0, 47.0, 44.0, 37.0, 32.0, 33.0, 34.0, 41.0, 36.0, 46.0, 35.0, 33.0, 28.0, 18.0, 24.0, 25.0, 22.0, 27.0, 19.0, 17.0, 11.0, 10.0, 3.0, 8.0, 8.0, 3.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.838257312774658, -5.665676116943359, -5.4930949211120605, -5.320513725280762, -5.147933006286621, -4.975351810455322, -4.802770614624023, -4.630189418792725, -4.457608222961426, -4.285027027130127, -4.112445831298828, -3.9398648738861084, -3.7672836780548096, -3.5947024822235107, -3.422121524810791, -3.249540328979492, -3.0769591331481934, -2.9043779373168945, -2.7317967414855957, -2.559215784072876, -2.386634588241577, -2.2140533924102783, -2.0414724349975586, -1.8688912391662598, -1.696310043334961, -1.523728847503662, -1.3511477708816528, -1.1785666942596436, -1.0059854984283447, -0.8334043622016907, -0.6608232259750366, -0.48824214935302734, -0.3156609535217285, -0.14307981729507446, 0.02950131893157959, 0.20208245515823364, 0.3746635913848877, 0.5472447276115417, 0.7198258638381958, 0.8924069404602051, 1.064988136291504, 1.2375693321228027, 1.410150408744812, 1.5827314853668213, 1.7553126811981201, 1.927893877029419, 2.1004748344421387, 2.2730560302734375, 2.4456372261047363, 2.618218421936035, 2.790799617767334, 2.9633805751800537, 3.1359617710113525, 3.3085429668426514, 3.481123924255371, 3.65370512008667, 3.8262863159179688, 3.9988675117492676, 4.171448707580566, 4.344029903411865, 4.516611099243164, 4.689191818237305, 4.8617730140686035, 5.034354209899902, 5.206935405731201]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 8.0, 5.0, 10.0, 22.0, 20.0, 38.0, 51.0, 78.0, 130.0, 407.0, 1600.0, 11294.0, 458804.0, 3682739.0, 34607.0, 3283.0, 702.0, 221.0, 82.0, 65.0, 47.0, 31.0, 14.0, 7.0, 10.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.1015625, -4.8817138671875, -4.661865234375, -4.4420166015625, -4.22216796875, -4.0023193359375, -3.782470703125, -3.5626220703125, -3.3427734375, -3.1229248046875, -2.903076171875, -2.6832275390625, -2.46337890625, -2.2435302734375, -2.023681640625, -1.8038330078125, -1.583984375, -1.3641357421875, -1.144287109375, -0.9244384765625, -0.70458984375, -0.4847412109375, -0.264892578125, -0.0450439453125, 0.1748046875, 0.3946533203125, 0.614501953125, 0.8343505859375, 1.05419921875, 1.2740478515625, 1.493896484375, 1.7137451171875, 1.93359375, 2.1534423828125, 2.373291015625, 2.5931396484375, 2.81298828125, 3.0328369140625, 3.252685546875, 3.4725341796875, 3.6923828125, 3.9122314453125, 4.132080078125, 4.3519287109375, 4.57177734375, 4.7916259765625, 5.011474609375, 5.2313232421875, 5.451171875, 5.6710205078125, 5.890869140625, 6.1107177734375, 6.33056640625, 6.5504150390625, 6.770263671875, 6.9901123046875, 7.2099609375, 7.4298095703125, 7.649658203125, 7.8695068359375, 8.08935546875, 8.3092041015625, 8.529052734375, 8.7489013671875, 8.96875]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 6.0, 1.0, 6.0, 10.0, 13.0, 17.0, 27.0, 32.0, 38.0, 58.0, 38.0, 57.0, 74.0, 69.0, 74.0, 68.0, 73.0, 60.0, 61.0, 47.0, 44.0, 34.0, 27.0, 30.0, 10.0, 15.0, 5.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5146484375, -1.4636077880859375, -1.412567138671875, -1.3615264892578125, -1.31048583984375, -1.2594451904296875, -1.208404541015625, -1.1573638916015625, -1.1063232421875, -1.0552825927734375, -1.004241943359375, -0.9532012939453125, -0.90216064453125, -0.8511199951171875, -0.800079345703125, -0.7490386962890625, -0.697998046875, -0.6469573974609375, -0.595916748046875, -0.5448760986328125, -0.49383544921875, -0.4427947998046875, -0.391754150390625, -0.3407135009765625, -0.2896728515625, -0.2386322021484375, -0.187591552734375, -0.1365509033203125, -0.08551025390625, -0.0344696044921875, 0.016571044921875, 0.0676116943359375, 0.11865234375, 0.1696929931640625, 0.220733642578125, 0.2717742919921875, 0.32281494140625, 0.3738555908203125, 0.424896240234375, 0.4759368896484375, 0.5269775390625, 0.5780181884765625, 0.629058837890625, 0.6800994873046875, 0.73114013671875, 0.7821807861328125, 0.833221435546875, 0.8842620849609375, 0.935302734375, 0.9863433837890625, 1.037384033203125, 1.0884246826171875, 1.13946533203125, 1.1905059814453125, 1.241546630859375, 1.2925872802734375, 1.3436279296875, 1.3946685791015625, 1.445709228515625, 1.4967498779296875, 1.54779052734375, 1.5988311767578125, 1.649871826171875, 1.7009124755859375, 1.751953125]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 7.0, 12.0, 21.0, 23.0, 43.0, 58.0, 96.0, 139.0, 271.0, 652.0, 1904.0, 9090.0, 76131.0, 2773924.0, 1277031.0, 45817.0, 6301.0, 1575.0, 546.0, 263.0, 141.0, 61.0, 50.0, 33.0, 20.0, 21.0, 6.0, 11.0, 4.0, 8.0, 5.0, 0.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.02734375, -3.87762451171875, -3.7279052734375, -3.57818603515625, -3.428466796875, -3.27874755859375, -3.1290283203125, -2.97930908203125, -2.82958984375, -2.67987060546875, -2.5301513671875, -2.38043212890625, -2.230712890625, -2.08099365234375, -1.9312744140625, -1.78155517578125, -1.6318359375, -1.48211669921875, -1.3323974609375, -1.18267822265625, -1.032958984375, -0.88323974609375, -0.7335205078125, -0.58380126953125, -0.43408203125, -0.28436279296875, -0.1346435546875, 0.01507568359375, 0.164794921875, 0.31451416015625, 0.4642333984375, 0.61395263671875, 0.763671875, 0.91339111328125, 1.0631103515625, 1.21282958984375, 1.362548828125, 1.51226806640625, 1.6619873046875, 1.81170654296875, 1.96142578125, 2.11114501953125, 2.2608642578125, 2.41058349609375, 2.560302734375, 2.71002197265625, 2.8597412109375, 3.00946044921875, 3.1591796875, 3.30889892578125, 3.4586181640625, 3.60833740234375, 3.758056640625, 3.90777587890625, 4.0574951171875, 4.20721435546875, 4.35693359375, 4.50665283203125, 4.6563720703125, 4.80609130859375, 4.955810546875, 5.10552978515625, 5.2552490234375, 5.40496826171875, 5.5546875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 5.0, 4.0, 12.0, 12.0, 18.0, 27.0, 25.0, 57.0, 85.0, 113.0, 191.0, 228.0, 368.0, 549.0, 690.0, 518.0, 395.0, 228.0, 168.0, 105.0, 77.0, 50.0, 43.0, 30.0, 21.0, 19.0, 6.0, 9.0, 4.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1083984375, -1.0788192749023438, -1.0492401123046875, -1.0196609497070312, -0.990081787109375, -0.9605026245117188, -0.9309234619140625, -0.9013442993164062, -0.87176513671875, -0.8421859741210938, -0.8126068115234375, -0.7830276489257812, -0.753448486328125, -0.7238693237304688, -0.6942901611328125, -0.6647109985351562, -0.6351318359375, -0.6055526733398438, -0.5759735107421875, -0.5463943481445312, -0.516815185546875, -0.48723602294921875, -0.4576568603515625, -0.42807769775390625, -0.39849853515625, -0.36891937255859375, -0.3393402099609375, -0.30976104736328125, -0.280181884765625, -0.25060272216796875, -0.2210235595703125, -0.19144439697265625, -0.161865234375, -0.13228607177734375, -0.1027069091796875, -0.07312774658203125, -0.043548583984375, -0.01396942138671875, 0.0156097412109375, 0.04518890380859375, 0.07476806640625, 0.10434722900390625, 0.1339263916015625, 0.16350555419921875, 0.193084716796875, 0.22266387939453125, 0.2522430419921875, 0.28182220458984375, 0.3114013671875, 0.34098052978515625, 0.3705596923828125, 0.40013885498046875, 0.429718017578125, 0.45929718017578125, 0.4888763427734375, 0.5184555053710938, 0.54803466796875, 0.5776138305664062, 0.6071929931640625, 0.6367721557617188, 0.666351318359375, 0.6959304809570312, 0.7255096435546875, 0.7550888061523438, 0.78466796875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 10.0, 13.0, 11.0, 29.0, 31.0, 36.0, 54.0, 66.0, 67.0, 86.0, 85.0, 90.0, 92.0, 67.0, 54.0, 52.0, 46.0, 28.0, 31.0, 15.0, 13.0, 10.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7800548076629639, -1.679813027381897, -1.57957124710083, -1.4793293476104736, -1.3790875673294067, -1.2788457870483398, -1.1786038875579834, -1.0783621072769165, -0.9781203269958496, -0.8778785467147827, -0.777636706829071, -0.6773948669433594, -0.5771530866622925, -0.4769113063812256, -0.3766694664955139, -0.27642762660980225, -0.17618584632873535, -0.07594403624534607, 0.024297773838043213, 0.1245395839214325, 0.22478139400482178, 0.32502317428588867, 0.42526501417160034, 0.525506854057312, 0.6257486343383789, 0.7259904146194458, 0.8262322545051575, 0.9264740943908691, 1.026715874671936, 1.126957654953003, 1.2271995544433594, 1.3274413347244263, 1.4276833534240723, 1.5279251337051392, 1.628166913986206, 1.7284088134765625, 1.8286505937576294, 1.9288923740386963, 2.0291342735290527, 2.12937593460083, 2.2296178340911865, 2.329859733581543, 2.4301013946533203, 2.5303432941436768, 2.630585193634033, 2.7308268547058105, 2.831068754196167, 2.9313106536865234, 3.031552314758301, 3.1317942142486572, 3.2320358753204346, 3.332277774810791, 3.4325194358825684, 3.532761335372925, 3.6330032348632812, 3.7332448959350586, 3.833486795425415, 3.9337286949157715, 4.033970355987549, 4.134212017059326, 4.234454154968262, 4.334695816040039, 4.434937477111816, 4.535179615020752, 4.635421276092529]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 2.0, 1.0, 3.0, 7.0, 6.0, 10.0, 9.0, 12.0, 9.0, 18.0, 20.0, 18.0, 24.0, 34.0, 35.0, 25.0, 44.0, 45.0, 49.0, 34.0, 43.0, 36.0, 45.0, 45.0, 59.0, 40.0, 33.0, 38.0, 37.0, 43.0, 21.0, 32.0, 22.0, 20.0, 17.0, 11.0, 6.0, 14.0, 10.0, 3.0, 8.0, 4.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4243059158325195, -1.3674544095993042, -1.3106030225753784, -1.253751516342163, -1.1969001293182373, -1.140048623085022, -1.0831971168518066, -1.0263457298278809, -0.9694942235946655, -0.912642776966095, -0.8557913303375244, -0.7989398241043091, -0.7420883774757385, -0.685236930847168, -0.6283854842185974, -0.5715340375900269, -0.5146825909614563, -0.45783114433288574, -0.4009796679019928, -0.34412822127342224, -0.2872767448425293, -0.23042529821395874, -0.17357385158538818, -0.11672237515449524, -0.05987092852592468, -0.0030194707214832306, 0.05383198708295822, 0.11068344116210938, 0.16753490269184113, 0.22438636422157288, 0.28123781085014343, 0.3380892872810364, 0.39494073390960693, 0.4517921805381775, 0.508643627166748, 0.5654951333999634, 0.6223465800285339, 0.6791980266571045, 0.736049473285675, 0.7929009199142456, 0.8497524261474609, 0.9066038727760315, 0.963455319404602, 1.0203068256378174, 1.0771582126617432, 1.1340097188949585, 1.1908612251281738, 1.2477126121520996, 1.3045639991760254, 1.3614155054092407, 1.4182668924331665, 1.4751183986663818, 1.5319697856903076, 1.588821291923523, 1.6456727981567383, 1.702524185180664, 1.7593756914138794, 1.8162271976470947, 1.8730785846710205, 1.9299300909042358, 1.9867814779281616, 2.043632984161377, 2.1004843711853027, 2.1573359966278076, 2.2141873836517334]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 5.0, 10.0, 12.0, 19.0, 18.0, 32.0, 55.0, 64.0, 126.0, 190.0, 305.0, 506.0, 1159.0, 7431.0, 843226.0, 190102.0, 3215.0, 951.0, 388.0, 251.0, 159.0, 98.0, 67.0, 52.0, 26.0, 23.0, 18.0, 12.0, 14.0, 4.0, 3.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.935546875, -0.9079055786132812, -0.8802642822265625, -0.8526229858398438, -0.824981689453125, -0.7973403930664062, -0.7696990966796875, -0.7420578002929688, -0.71441650390625, -0.6867752075195312, -0.6591339111328125, -0.6314926147460938, -0.603851318359375, -0.5762100219726562, -0.5485687255859375, -0.5209274291992188, -0.4932861328125, -0.46564483642578125, -0.4380035400390625, -0.41036224365234375, -0.382720947265625, -0.35507965087890625, -0.3274383544921875, -0.29979705810546875, -0.27215576171875, -0.24451446533203125, -0.2168731689453125, -0.18923187255859375, -0.161590576171875, -0.13394927978515625, -0.1063079833984375, -0.07866668701171875, -0.051025390625, -0.02338409423828125, 0.0042572021484375, 0.03189849853515625, 0.059539794921875, 0.08718109130859375, 0.1148223876953125, 0.14246368408203125, 0.17010498046875, 0.19774627685546875, 0.2253875732421875, 0.25302886962890625, 0.280670166015625, 0.30831146240234375, 0.3359527587890625, 0.36359405517578125, 0.3912353515625, 0.41887664794921875, 0.4465179443359375, 0.47415924072265625, 0.501800537109375, 0.5294418334960938, 0.5570831298828125, 0.5847244262695312, 0.61236572265625, 0.6400070190429688, 0.6676483154296875, 0.6952896118164062, 0.722930908203125, 0.7505722045898438, 0.7782135009765625, 0.8058547973632812, 0.83349609375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 1.0, 5.0, 7.0, 14.0, 15.0, 12.0, 15.0, 27.0, 20.0, 35.0, 44.0, 53.0, 47.0, 65.0, 57.0, 72.0, 64.0, 55.0, 65.0, 58.0, 63.0, 47.0, 34.0, 29.0, 30.0, 21.0, 11.0, 11.0, 10.0, 8.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7744140625, -1.71929931640625, -1.6641845703125, -1.60906982421875, -1.553955078125, -1.49884033203125, -1.4437255859375, -1.38861083984375, -1.33349609375, -1.27838134765625, -1.2232666015625, -1.16815185546875, -1.113037109375, -1.05792236328125, -1.0028076171875, -0.94769287109375, -0.892578125, -0.83746337890625, -0.7823486328125, -0.72723388671875, -0.672119140625, -0.61700439453125, -0.5618896484375, -0.50677490234375, -0.45166015625, -0.39654541015625, -0.3414306640625, -0.28631591796875, -0.231201171875, -0.17608642578125, -0.1209716796875, -0.06585693359375, -0.0107421875, 0.04437255859375, 0.0994873046875, 0.15460205078125, 0.209716796875, 0.26483154296875, 0.3199462890625, 0.37506103515625, 0.43017578125, 0.48529052734375, 0.5404052734375, 0.59552001953125, 0.650634765625, 0.70574951171875, 0.7608642578125, 0.81597900390625, 0.87109375, 0.92620849609375, 0.9813232421875, 1.03643798828125, 1.091552734375, 1.14666748046875, 1.2017822265625, 1.25689697265625, 1.31201171875, 1.36712646484375, 1.4222412109375, 1.47735595703125, 1.532470703125, 1.58758544921875, 1.6427001953125, 1.69781494140625, 1.7529296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 8.0, 5.0, 3.0, 4.0, 5.0, 14.0, 12.0, 7.0, 24.0, 20.0, 32.0, 30.0, 48.0, 53.0, 84.0, 90.0, 129.0, 138.0, 218.0, 351.0, 558.0, 1521.0, 7984.0, 79778.0, 764801.0, 175249.0, 13520.0, 1907.0, 638.0, 338.0, 222.0, 199.0, 150.0, 108.0, 71.0, 60.0, 43.0, 26.0, 31.0, 29.0, 17.0, 9.0, 11.0, 10.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.32958984375, -0.32007598876953125, -0.3105621337890625, -0.30104827880859375, -0.291534423828125, -0.28202056884765625, -0.2725067138671875, -0.26299285888671875, -0.25347900390625, -0.24396514892578125, -0.2344512939453125, -0.22493743896484375, -0.215423583984375, -0.20590972900390625, -0.1963958740234375, -0.18688201904296875, -0.1773681640625, -0.16785430908203125, -0.1583404541015625, -0.14882659912109375, -0.139312744140625, -0.12979888916015625, -0.1202850341796875, -0.11077117919921875, -0.10125732421875, -0.09174346923828125, -0.0822296142578125, -0.07271575927734375, -0.063201904296875, -0.05368804931640625, -0.0441741943359375, -0.03466033935546875, -0.025146484375, -0.01563262939453125, -0.0061187744140625, 0.00339508056640625, 0.012908935546875, 0.02242279052734375, 0.0319366455078125, 0.04145050048828125, 0.05096435546875, 0.06047821044921875, 0.0699920654296875, 0.07950592041015625, 0.089019775390625, 0.09853363037109375, 0.1080474853515625, 0.11756134033203125, 0.1270751953125, 0.13658905029296875, 0.1461029052734375, 0.15561676025390625, 0.165130615234375, 0.17464447021484375, 0.1841583251953125, 0.19367218017578125, 0.20318603515625, 0.21269989013671875, 0.2222137451171875, 0.23172760009765625, 0.241241455078125, 0.25075531005859375, 0.2602691650390625, 0.26978302001953125, 0.279296875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 2.0, 7.0, 5.0, 4.0, 5.0, 5.0, 9.0, 15.0, 9.0, 13.0, 13.0, 22.0, 29.0, 22.0, 29.0, 44.0, 47.0, 35.0, 47.0, 41.0, 42.0, 31.0, 55.0, 46.0, 31.0, 53.0, 40.0, 33.0, 32.0, 37.0, 27.0, 38.0, 15.0, 24.0, 21.0, 19.0, 12.0, 11.0, 11.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.005859375, -2.913818359375, -2.82177734375, -2.729736328125, -2.6376953125, -2.545654296875, -2.45361328125, -2.361572265625, -2.26953125, -2.177490234375, -2.08544921875, -1.993408203125, -1.9013671875, -1.809326171875, -1.71728515625, -1.625244140625, -1.533203125, -1.441162109375, -1.34912109375, -1.257080078125, -1.1650390625, -1.072998046875, -0.98095703125, -0.888916015625, -0.796875, -0.704833984375, -0.61279296875, -0.520751953125, -0.4287109375, -0.336669921875, -0.24462890625, -0.152587890625, -0.060546875, 0.031494140625, 0.12353515625, 0.215576171875, 0.3076171875, 0.399658203125, 0.49169921875, 0.583740234375, 0.67578125, 0.767822265625, 0.85986328125, 0.951904296875, 1.0439453125, 1.135986328125, 1.22802734375, 1.320068359375, 1.412109375, 1.504150390625, 1.59619140625, 1.688232421875, 1.7802734375, 1.872314453125, 1.96435546875, 2.056396484375, 2.1484375, 2.240478515625, 2.33251953125, 2.424560546875, 2.5166015625, 2.608642578125, 2.70068359375, 2.792724609375, 2.884765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 7.0, 6.0, 10.0, 6.0, 12.0, 20.0, 37.0, 75.0, 186.0, 671.0, 6441.0, 1037429.0, 2890.0, 471.0, 165.0, 69.0, 19.0, 11.0, 11.0, 7.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.34814453125, -0.33930397033691406, -0.3304634094238281, -0.3216228485107422, -0.31278228759765625, -0.3039417266845703, -0.2951011657714844, -0.28626060485839844, -0.2774200439453125, -0.26857948303222656, -0.2597389221191406, -0.2508983612060547, -0.24205780029296875, -0.2332172393798828, -0.22437667846679688, -0.21553611755371094, -0.206695556640625, -0.19785499572753906, -0.18901443481445312, -0.1801738739013672, -0.17133331298828125, -0.1624927520751953, -0.15365219116210938, -0.14481163024902344, -0.1359710693359375, -0.12713050842285156, -0.11828994750976562, -0.10944938659667969, -0.10060882568359375, -0.09176826477050781, -0.08292770385742188, -0.07408714294433594, -0.06524658203125, -0.05640602111816406, -0.047565460205078125, -0.03872489929199219, -0.02988433837890625, -0.021043777465820312, -0.012203216552734375, -0.0033626556396484375, 0.0054779052734375, 0.014318466186523438, 0.023159027099609375, 0.03199958801269531, 0.04084014892578125, 0.04968070983886719, 0.058521270751953125, 0.06736183166503906, 0.076202392578125, 0.08504295349121094, 0.09388351440429688, 0.10272407531738281, 0.11156463623046875, 0.12040519714355469, 0.12924575805664062, 0.13808631896972656, 0.1469268798828125, 0.15576744079589844, 0.16460800170898438, 0.1734485626220703, 0.18228912353515625, 0.1911296844482422, 0.19997024536132812, 0.20881080627441406, 0.2176513671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 6.0, 3.0, 6.0, 8.0, 9.0, 11.0, 30.0, 44.0, 62.0, 64.0, 89.0, 116.0, 130.0, 113.0, 97.0, 56.0, 44.0, 30.0, 20.0, 14.0, 13.0, 11.0, 4.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.653764724731445e-05, -3.540609031915665e-05, -3.427453339099884e-05, -3.3142976462841034e-05, -3.201141953468323e-05, -3.087986260652542e-05, -2.9748305678367615e-05, -2.861674875020981e-05, -2.7485191822052002e-05, -2.6353634893894196e-05, -2.522207796573639e-05, -2.4090521037578583e-05, -2.2958964109420776e-05, -2.182740718126297e-05, -2.0695850253105164e-05, -1.9564293324947357e-05, -1.843273639678955e-05, -1.7301179468631744e-05, -1.6169622540473938e-05, -1.5038065612316132e-05, -1.3906508684158325e-05, -1.2774951756000519e-05, -1.1643394827842712e-05, -1.0511837899684906e-05, -9.3802809715271e-06, -8.248724043369293e-06, -7.117167115211487e-06, -5.98561018705368e-06, -4.854053258895874e-06, -3.7224963307380676e-06, -2.5909394025802612e-06, -1.4593824744224548e-06, -3.2782554626464844e-07, 8.03731381893158e-07, 1.9352883100509644e-06, 3.0668452382087708e-06, 4.198402166366577e-06, 5.3299590945243835e-06, 6.46151602268219e-06, 7.593072950839996e-06, 8.724629878997803e-06, 9.856186807155609e-06, 1.0987743735313416e-05, 1.2119300663471222e-05, 1.3250857591629028e-05, 1.4382414519786835e-05, 1.551397144794464e-05, 1.6645528376102448e-05, 1.7777085304260254e-05, 1.890864223241806e-05, 2.0040199160575867e-05, 2.1171756088733673e-05, 2.230331301689148e-05, 2.3434869945049286e-05, 2.4566426873207092e-05, 2.56979838013649e-05, 2.6829540729522705e-05, 2.796109765768051e-05, 2.9092654585838318e-05, 3.0224211513996124e-05, 3.135576844215393e-05, 3.248732537031174e-05, 3.3618882298469543e-05, 3.475043922662735e-05, 3.5881996154785156e-05]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 8.0, 7.0, 12.0, 15.0, 28.0, 30.0, 50.0, 66.0, 91.0, 123.0, 219.0, 314.0, 618.0, 1166.0, 2606.0, 6880.0, 25681.0, 762661.0, 219558.0, 18314.0, 5669.0, 2179.0, 1010.0, 487.0, 278.0, 170.0, 111.0, 79.0, 42.0, 29.0, 18.0, 16.0, 8.0, 9.0, 9.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10711669921875, -0.1034078598022461, -0.09969902038574219, -0.09599018096923828, -0.09228134155273438, -0.08857250213623047, -0.08486366271972656, -0.08115482330322266, -0.07744598388671875, -0.07373714447021484, -0.07002830505371094, -0.06631946563720703, -0.06261062622070312, -0.05890178680419922, -0.05519294738769531, -0.051484107971191406, -0.0477752685546875, -0.044066429138183594, -0.04035758972167969, -0.03664875030517578, -0.032939910888671875, -0.02923107147216797, -0.025522232055664062, -0.021813392639160156, -0.01810455322265625, -0.014395713806152344, -0.010686874389648438, -0.006978034973144531, -0.003269195556640625, 0.00043964385986328125, 0.0041484832763671875, 0.007857322692871094, 0.011566162109375, 0.015275001525878906, 0.018983840942382812, 0.02269268035888672, 0.026401519775390625, 0.03011035919189453, 0.03381919860839844, 0.037528038024902344, 0.04123687744140625, 0.044945716857910156, 0.04865455627441406, 0.05236339569091797, 0.056072235107421875, 0.05978107452392578, 0.06348991394042969, 0.0671987533569336, 0.0709075927734375, 0.0746164321899414, 0.07832527160644531, 0.08203411102294922, 0.08574295043945312, 0.08945178985595703, 0.09316062927246094, 0.09686946868896484, 0.10057830810546875, 0.10428714752197266, 0.10799598693847656, 0.11170482635498047, 0.11541366577148438, 0.11912250518798828, 0.12283134460449219, 0.1265401840209961, 0.1302490234375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 9.0, 5.0, 11.0, 26.0, 47.0, 295.0, 449.0, 78.0, 36.0, 10.0, 11.0, 7.0, 4.0, 1.0, 5.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.061279296875, -0.05953407287597656, -0.057788848876953125, -0.05604362487792969, -0.05429840087890625, -0.05255317687988281, -0.050807952880859375, -0.04906272888183594, -0.0473175048828125, -0.04557228088378906, -0.043827056884765625, -0.04208183288574219, -0.04033660888671875, -0.03859138488769531, -0.036846160888671875, -0.03510093688964844, -0.033355712890625, -0.03161048889160156, -0.029865264892578125, -0.028120040893554688, -0.02637481689453125, -0.024629592895507812, -0.022884368896484375, -0.021139144897460938, -0.0193939208984375, -0.017648696899414062, -0.015903472900390625, -0.014158248901367188, -0.01241302490234375, -0.010667800903320312, -0.008922576904296875, -0.0071773529052734375, -0.00543212890625, -0.0036869049072265625, -0.001941680908203125, -0.0001964569091796875, 0.00154876708984375, 0.0032939910888671875, 0.005039215087890625, 0.0067844390869140625, 0.0085296630859375, 0.010274887084960938, 0.012020111083984375, 0.013765335083007812, 0.01551055908203125, 0.017255783081054688, 0.019001007080078125, 0.020746231079101562, 0.022491455078125, 0.024236679077148438, 0.025981903076171875, 0.027727127075195312, 0.02947235107421875, 0.031217575073242188, 0.032962799072265625, 0.03470802307128906, 0.0364532470703125, 0.03819847106933594, 0.039943695068359375, 0.04168891906738281, 0.04343414306640625, 0.04517936706542969, 0.046924591064453125, 0.04866981506347656, 0.0504150390625]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 4.0, 6.0, 3.0, 12.0, 5.0, 6.0, 12.0, 21.0, 22.0, 21.0, 24.0, 32.0, 33.0, 30.0, 46.0, 51.0, 50.0, 54.0, 44.0, 60.0, 50.0, 42.0, 45.0, 38.0, 45.0, 33.0, 31.0, 28.0, 25.0, 15.0, 27.0, 16.0, 18.0, 10.0, 8.0, 7.0, 7.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1751829385757446, -1.1364110708236694, -1.0976390838623047, -1.0588672161102295, -1.0200952291488647, -0.9813233613967896, -0.9425514340400696, -0.9037795066833496, -0.8650075793266296, -0.8262356519699097, -0.7874637246131897, -0.7486917972564697, -0.7099199295043945, -0.6711479425430298, -0.6323760747909546, -0.5936041474342346, -0.5548322200775146, -0.5160602927207947, -0.4772883653640747, -0.4385164678096771, -0.39974454045295715, -0.3609726130962372, -0.3222007155418396, -0.28342878818511963, -0.24465686082839966, -0.2058849334716797, -0.1671130210161209, -0.12834110856056213, -0.08956918120384216, -0.05079725384712219, -0.012025341391563416, 0.02674657106399536, 0.06551837921142578, 0.10429029911756516, 0.14306221902370453, 0.1818341314792633, 0.22060605883598328, 0.25937798619270325, 0.29814988374710083, 0.3369218111038208, 0.37569373846054077, 0.41446566581726074, 0.4532375931739807, 0.4920094907283783, 0.5307813882827759, 0.5695533752441406, 0.6083252429962158, 0.6470971703529358, 0.6858690977096558, 0.7246410250663757, 0.7634129524230957, 0.8021848797798157, 0.8409568071365356, 0.8797286748886108, 0.9185006022453308, 0.9572725296020508, 0.9960444569587708, 1.0348163843154907, 1.073588252067566, 1.1123602390289307, 1.1511321067810059, 1.1899040937423706, 1.2286759614944458, 1.2674479484558105, 1.3062198162078857]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 1.0, 4.0, 6.0, 7.0, 11.0, 11.0, 10.0, 19.0, 24.0, 26.0, 28.0, 34.0, 29.0, 44.0, 49.0, 54.0, 53.0, 39.0, 70.0, 49.0, 54.0, 44.0, 48.0, 46.0, 42.0, 42.0, 26.0, 28.0, 27.0, 15.0, 17.0, 8.0, 11.0, 5.0, 9.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2294435501098633, -1.185463309288025, -1.1414830684661865, -1.0975029468536377, -1.0535227060317993, -1.009542465209961, -0.9655622839927673, -0.9215821027755737, -0.8776018619537354, -0.833621621131897, -0.7896414399147034, -0.7456612586975098, -0.7016810178756714, -0.657700777053833, -0.6137205958366394, -0.5697404146194458, -0.5257601737976074, -0.48177996277809143, -0.43779975175857544, -0.39381954073905945, -0.34983932971954346, -0.30585911870002747, -0.2618789076805115, -0.21789869666099548, -0.1739184856414795, -0.1299382746219635, -0.08595806360244751, -0.04197785258293152, 0.0020023584365844727, 0.045982569456100464, 0.08996278047561646, 0.13394299149513245, 0.1779230833053589, 0.22190329432487488, 0.26588350534439087, 0.30986371636390686, 0.35384392738342285, 0.39782413840293884, 0.44180434942245483, 0.4857845604419708, 0.5297647714614868, 0.5737450122833252, 0.6177251935005188, 0.6617053747177124, 0.7056856155395508, 0.7496658563613892, 0.7936460375785828, 0.8376262187957764, 0.8816064596176147, 0.9255867004394531, 0.9695668816566467, 1.0135470628738403, 1.0575273036956787, 1.101507544517517, 1.1454877853393555, 1.1894679069519043, 1.2334481477737427, 1.277428388595581, 1.3214085102081299, 1.3653887510299683, 1.4093689918518066, 1.453349232673645, 1.4973294734954834, 1.5413095951080322, 1.5852898359298706]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 12.0, 18.0, 18.0, 11.0, 24.0, 35.0, 42.0, 75.0, 106.0, 149.0, 240.0, 355.0, 598.0, 948.0, 1705.0, 2855.0, 5459.0, 11061.0, 25231.0, 69582.0, 221988.0, 419815.0, 185975.0, 58595.0, 22240.0, 9772.0, 5060.0, 2603.0, 1502.0, 890.0, 548.0, 309.0, 215.0, 153.0, 96.0, 70.0, 58.0, 27.0, 24.0, 29.0, 8.0, 14.0, 13.0, 6.0, 7.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.650390625, -1.5902099609375, -1.530029296875, -1.4698486328125, -1.40966796875, -1.3494873046875, -1.289306640625, -1.2291259765625, -1.1689453125, -1.1087646484375, -1.048583984375, -0.9884033203125, -0.92822265625, -0.8680419921875, -0.807861328125, -0.7476806640625, -0.6875, -0.6273193359375, -0.567138671875, -0.5069580078125, -0.44677734375, -0.3865966796875, -0.326416015625, -0.2662353515625, -0.2060546875, -0.1458740234375, -0.085693359375, -0.0255126953125, 0.03466796875, 0.0948486328125, 0.155029296875, 0.2152099609375, 0.275390625, 0.3355712890625, 0.395751953125, 0.4559326171875, 0.51611328125, 0.5762939453125, 0.636474609375, 0.6966552734375, 0.7568359375, 0.8170166015625, 0.877197265625, 0.9373779296875, 0.99755859375, 1.0577392578125, 1.117919921875, 1.1781005859375, 1.23828125, 1.2984619140625, 1.358642578125, 1.4188232421875, 1.47900390625, 1.5391845703125, 1.599365234375, 1.6595458984375, 1.7197265625, 1.7799072265625, 1.840087890625, 1.9002685546875, 1.96044921875, 2.0206298828125, 2.080810546875, 2.1409912109375, 2.201171875]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 2.0, 5.0, 2.0, 2.0, 4.0, 13.0, 21.0, 17.0, 22.0, 22.0, 24.0, 31.0, 43.0, 47.0, 49.0, 49.0, 56.0, 60.0, 49.0, 72.0, 60.0, 62.0, 40.0, 39.0, 31.0, 45.0, 33.0, 27.0, 17.0, 12.0, 11.0, 9.0, 8.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.740234375, -2.655426025390625, -2.57061767578125, -2.485809326171875, -2.4010009765625, -2.316192626953125, -2.23138427734375, -2.146575927734375, -2.061767578125, -1.976959228515625, -1.89215087890625, -1.807342529296875, -1.7225341796875, -1.637725830078125, -1.55291748046875, -1.468109130859375, -1.38330078125, -1.298492431640625, -1.21368408203125, -1.128875732421875, -1.0440673828125, -0.959259033203125, -0.87445068359375, -0.789642333984375, -0.704833984375, -0.620025634765625, -0.53521728515625, -0.450408935546875, -0.3656005859375, -0.280792236328125, -0.19598388671875, -0.111175537109375, -0.0263671875, 0.058441162109375, 0.14324951171875, 0.228057861328125, 0.3128662109375, 0.397674560546875, 0.48248291015625, 0.567291259765625, 0.652099609375, 0.736907958984375, 0.82171630859375, 0.906524658203125, 0.9913330078125, 1.076141357421875, 1.16094970703125, 1.245758056640625, 1.33056640625, 1.415374755859375, 1.50018310546875, 1.584991455078125, 1.6697998046875, 1.754608154296875, 1.83941650390625, 1.924224853515625, 2.009033203125, 2.093841552734375, 2.17864990234375, 2.263458251953125, 2.3482666015625, 2.433074951171875, 2.51788330078125, 2.602691650390625, 2.6875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 5.0, 7.0, 4.0, 13.0, 23.0, 12.0, 22.0, 41.0, 61.0, 81.0, 112.0, 163.0, 237.0, 462.0, 718.0, 1213.0, 2235.0, 4181.0, 9062.0, 22308.0, 73534.0, 328652.0, 445536.0, 108160.0, 29237.0, 11194.0, 5033.0, 2606.0, 1420.0, 796.0, 472.0, 292.0, 206.0, 128.0, 102.0, 79.0, 43.0, 44.0, 16.0, 16.0, 7.0, 5.0, 5.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.349609375, -2.274139404296875, -2.19866943359375, -2.123199462890625, -2.0477294921875, -1.972259521484375, -1.89678955078125, -1.821319580078125, -1.745849609375, -1.670379638671875, -1.59490966796875, -1.519439697265625, -1.4439697265625, -1.368499755859375, -1.29302978515625, -1.217559814453125, -1.14208984375, -1.066619873046875, -0.99114990234375, -0.915679931640625, -0.8402099609375, -0.764739990234375, -0.68927001953125, -0.613800048828125, -0.538330078125, -0.462860107421875, -0.38739013671875, -0.311920166015625, -0.2364501953125, -0.160980224609375, -0.08551025390625, -0.010040283203125, 0.0654296875, 0.140899658203125, 0.21636962890625, 0.291839599609375, 0.3673095703125, 0.442779541015625, 0.51824951171875, 0.593719482421875, 0.669189453125, 0.744659423828125, 0.82012939453125, 0.895599365234375, 0.9710693359375, 1.046539306640625, 1.12200927734375, 1.197479248046875, 1.27294921875, 1.348419189453125, 1.42388916015625, 1.499359130859375, 1.5748291015625, 1.650299072265625, 1.72576904296875, 1.801239013671875, 1.876708984375, 1.952178955078125, 2.02764892578125, 2.103118896484375, 2.1785888671875, 2.254058837890625, 2.32952880859375, 2.404998779296875, 2.48046875]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 5.0, 6.0, 13.0, 10.0, 8.0, 20.0, 18.0, 22.0, 31.0, 38.0, 38.0, 37.0, 44.0, 40.0, 34.0, 47.0, 53.0, 49.0, 47.0, 56.0, 43.0, 47.0, 47.0, 42.0, 30.0, 35.0, 20.0, 16.0, 18.0, 20.0, 16.0, 10.0, 8.0, 9.0, 6.0, 4.0, 0.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.998046875, -2.896484375, -2.794921875, -2.693359375, -2.591796875, -2.490234375, -2.388671875, -2.287109375, -2.185546875, -2.083984375, -1.982421875, -1.880859375, -1.779296875, -1.677734375, -1.576171875, -1.474609375, -1.373046875, -1.271484375, -1.169921875, -1.068359375, -0.966796875, -0.865234375, -0.763671875, -0.662109375, -0.560546875, -0.458984375, -0.357421875, -0.255859375, -0.154296875, -0.052734375, 0.048828125, 0.150390625, 0.251953125, 0.353515625, 0.455078125, 0.556640625, 0.658203125, 0.759765625, 0.861328125, 0.962890625, 1.064453125, 1.166015625, 1.267578125, 1.369140625, 1.470703125, 1.572265625, 1.673828125, 1.775390625, 1.876953125, 1.978515625, 2.080078125, 2.181640625, 2.283203125, 2.384765625, 2.486328125, 2.587890625, 2.689453125, 2.791015625, 2.892578125, 2.994140625, 3.095703125, 3.197265625, 3.298828125, 3.400390625, 3.501953125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 5.0, 9.0, 15.0, 19.0, 14.0, 36.0, 55.0, 65.0, 70.0, 111.0, 156.0, 195.0, 300.0, 407.0, 587.0, 833.0, 1342.0, 2218.0, 4032.0, 8866.0, 23084.0, 70107.0, 239180.0, 467579.0, 152590.0, 45207.0, 16063.0, 6743.0, 3220.0, 1844.0, 1089.0, 688.0, 487.0, 342.0, 254.0, 190.0, 133.0, 106.0, 81.0, 64.0, 49.0, 35.0, 24.0, 19.0, 8.0, 10.0, 8.0, 4.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.6474609375, -0.6267852783203125, -0.606109619140625, -0.5854339599609375, -0.56475830078125, -0.5440826416015625, -0.523406982421875, -0.5027313232421875, -0.4820556640625, -0.4613800048828125, -0.440704345703125, -0.4200286865234375, -0.39935302734375, -0.3786773681640625, -0.358001708984375, -0.3373260498046875, -0.316650390625, -0.2959747314453125, -0.275299072265625, -0.2546234130859375, -0.23394775390625, -0.2132720947265625, -0.192596435546875, -0.1719207763671875, -0.1512451171875, -0.1305694580078125, -0.109893798828125, -0.0892181396484375, -0.06854248046875, -0.0478668212890625, -0.027191162109375, -0.0065155029296875, 0.01416015625, 0.0348358154296875, 0.055511474609375, 0.0761871337890625, 0.09686279296875, 0.1175384521484375, 0.138214111328125, 0.1588897705078125, 0.1795654296875, 0.2002410888671875, 0.220916748046875, 0.2415924072265625, 0.26226806640625, 0.2829437255859375, 0.303619384765625, 0.3242950439453125, 0.344970703125, 0.3656463623046875, 0.386322021484375, 0.4069976806640625, 0.42767333984375, 0.4483489990234375, 0.469024658203125, 0.4897003173828125, 0.5103759765625, 0.5310516357421875, 0.551727294921875, 0.5724029541015625, 0.59307861328125, 0.6137542724609375, 0.634429931640625, 0.6551055908203125, 0.67578125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 3.0, 7.0, 7.0, 5.0, 7.0, 13.0, 13.0, 33.0, 51.0, 58.0, 83.0, 105.0, 171.0, 118.0, 85.0, 67.0, 59.0, 35.0, 26.0, 20.0, 14.0, 8.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014925003051757812, -0.00014317035675048828, -0.00013709068298339844, -0.0001310110092163086, -0.00012493133544921875, -0.0001188516616821289, -0.00011277198791503906, -0.00010669231414794922, -0.00010061264038085938, -9.453296661376953e-05, -8.845329284667969e-05, -8.237361907958984e-05, -7.62939453125e-05, -7.021427154541016e-05, -6.413459777832031e-05, -5.805492401123047e-05, -5.1975250244140625e-05, -4.589557647705078e-05, -3.981590270996094e-05, -3.3736228942871094e-05, -2.765655517578125e-05, -2.1576881408691406e-05, -1.5497207641601562e-05, -9.417533874511719e-06, -3.337860107421875e-06, 2.7418136596679688e-06, 8.821487426757812e-06, 1.4901161193847656e-05, 2.09808349609375e-05, 2.7060508728027344e-05, 3.314018249511719e-05, 3.921985626220703e-05, 4.5299530029296875e-05, 5.137920379638672e-05, 5.745887756347656e-05, 6.35385513305664e-05, 6.961822509765625e-05, 7.56978988647461e-05, 8.177757263183594e-05, 8.785724639892578e-05, 9.393692016601562e-05, 0.00010001659393310547, 0.00010609626770019531, 0.00011217594146728516, 0.000118255615234375, 0.00012433528900146484, 0.0001304149627685547, 0.00013649463653564453, 0.00014257431030273438, 0.00014865398406982422, 0.00015473365783691406, 0.0001608133316040039, 0.00016689300537109375, 0.0001729726791381836, 0.00017905235290527344, 0.00018513202667236328, 0.00019121170043945312, 0.00019729137420654297, 0.0002033710479736328, 0.00020945072174072266, 0.0002155303955078125, 0.00022161006927490234, 0.0002276897430419922, 0.00023376941680908203, 0.00023984909057617188]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 4.0, 8.0, 10.0, 11.0, 11.0, 23.0, 31.0, 31.0, 30.0, 40.0, 75.0, 89.0, 116.0, 165.0, 260.0, 389.0, 574.0, 1020.0, 1894.0, 4426.0, 12209.0, 45568.0, 229892.0, 574124.0, 132804.0, 28826.0, 8575.0, 3328.0, 1557.0, 821.0, 478.0, 339.0, 233.0, 136.0, 120.0, 72.0, 65.0, 48.0, 32.0, 32.0, 22.0, 17.0, 15.0, 15.0, 6.0, 4.0, 6.0, 2.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94140625, -0.9093170166015625, -0.877227783203125, -0.8451385498046875, -0.81304931640625, -0.7809600830078125, -0.748870849609375, -0.7167816162109375, -0.6846923828125, -0.6526031494140625, -0.620513916015625, -0.5884246826171875, -0.55633544921875, -0.5242462158203125, -0.492156982421875, -0.4600677490234375, -0.427978515625, -0.3958892822265625, -0.363800048828125, -0.3317108154296875, -0.29962158203125, -0.2675323486328125, -0.235443115234375, -0.2033538818359375, -0.1712646484375, -0.1391754150390625, -0.107086181640625, -0.0749969482421875, -0.04290771484375, -0.0108184814453125, 0.021270751953125, 0.0533599853515625, 0.08544921875, 0.1175384521484375, 0.149627685546875, 0.1817169189453125, 0.21380615234375, 0.2458953857421875, 0.277984619140625, 0.3100738525390625, 0.3421630859375, 0.3742523193359375, 0.406341552734375, 0.4384307861328125, 0.47052001953125, 0.5026092529296875, 0.534698486328125, 0.5667877197265625, 0.598876953125, 0.6309661865234375, 0.663055419921875, 0.6951446533203125, 0.72723388671875, 0.7593231201171875, 0.791412353515625, 0.8235015869140625, 0.8555908203125, 0.8876800537109375, 0.919769287109375, 0.9518585205078125, 0.98394775390625, 1.0160369873046875, 1.048126220703125, 1.0802154541015625, 1.1123046875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 6.0, 11.0, 13.0, 24.0, 35.0, 63.0, 78.0, 104.0, 189.0, 149.0, 97.0, 75.0, 44.0, 39.0, 25.0, 15.0, 13.0, 10.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8505859375, -0.8261947631835938, -0.8018035888671875, -0.7774124145507812, -0.753021240234375, -0.7286300659179688, -0.7042388916015625, -0.6798477172851562, -0.65545654296875, -0.6310653686523438, -0.6066741943359375, -0.5822830200195312, -0.557891845703125, -0.5335006713867188, -0.5091094970703125, -0.48471832275390625, -0.4603271484375, -0.43593597412109375, -0.4115447998046875, -0.38715362548828125, -0.362762451171875, -0.33837127685546875, -0.3139801025390625, -0.28958892822265625, -0.26519775390625, -0.24080657958984375, -0.2164154052734375, -0.19202423095703125, -0.167633056640625, -0.14324188232421875, -0.1188507080078125, -0.09445953369140625, -0.070068359375, -0.04567718505859375, -0.0212860107421875, 0.00310516357421875, 0.027496337890625, 0.05188751220703125, 0.0762786865234375, 0.10066986083984375, 0.12506103515625, 0.14945220947265625, 0.1738433837890625, 0.19823455810546875, 0.222625732421875, 0.24701690673828125, 0.2714080810546875, 0.29579925537109375, 0.3201904296875, 0.34458160400390625, 0.3689727783203125, 0.39336395263671875, 0.417755126953125, 0.44214630126953125, 0.4665374755859375, 0.49092864990234375, 0.51531982421875, 0.5397109985351562, 0.5641021728515625, 0.5884933471679688, 0.612884521484375, 0.6372756958007812, 0.6616668701171875, 0.6860580444335938, 0.71044921875]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 2.0, 7.0, 12.0, 27.0, 45.0, 93.0, 143.0, 180.0, 164.0, 126.0, 93.0, 51.0, 29.0, 13.0, 7.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.819700002670288, -2.505915641784668, -2.192131280899048, -1.8783470392227173, -1.5645626783370972, -1.250778317451477, -0.9369940757751465, -0.6232097148895264, -0.30942535400390625, 0.0043589770793914795, 0.3181433081626892, 0.6319276094436646, 0.9457119703292847, 1.2594963312149048, 1.5732805728912354, 1.8870649337768555, 2.2008492946624756, 2.5146336555480957, 2.828418016433716, 3.142202377319336, 3.455986499786377, 3.769771099090576, 4.083555221557617, 4.397339820861816, 4.711123943328857, 5.024908065795898, 5.338692665100098, 5.652476787567139, 5.966261386871338, 6.280045509338379, 6.593830108642578, 6.907614231109619, 7.22139835357666, 7.535182476043701, 7.8489670753479, 8.162751197814941, 8.47653579711914, 8.79032039642334, 9.104104042053223, 9.417888641357422, 9.731673240661621, 10.04545783996582, 10.359241485595703, 10.673026084899902, 10.986810684204102, 11.3005952835083, 11.614378929138184, 11.928163528442383, 12.241947174072266, 12.555731773376465, 12.869515419006348, 13.183300018310547, 13.497084617614746, 13.810869216918945, 14.124652862548828, 14.438437461853027, 14.752222061157227, 15.066006660461426, 15.379790306091309, 15.693574905395508, 16.00735855102539, 16.321144104003906, 16.63492774963379, 16.948711395263672, 17.262496948242188]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 10.0, 10.0, 11.0, 10.0, 27.0, 18.0, 17.0, 20.0, 35.0, 34.0, 30.0, 43.0, 46.0, 37.0, 36.0, 35.0, 42.0, 48.0, 42.0, 46.0, 40.0, 36.0, 44.0, 30.0, 46.0, 31.0, 32.0, 30.0, 18.0, 20.0, 21.0, 9.0, 15.0, 5.0, 3.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.205555438995361, -5.030652046203613, -4.855748176574707, -4.680844783782959, -4.505941390991211, -4.331037521362305, -4.156134128570557, -3.9812304973602295, -3.8063268661499023, -3.631423234939575, -3.456519603729248, -3.2816162109375, -3.106712579727173, -2.9318089485168457, -2.7569055557250977, -2.5820019245147705, -2.4070982933044434, -2.232194662094116, -2.057291030883789, -1.882387638092041, -1.7074840068817139, -1.5325803756713867, -1.3576768636703491, -1.1827733516693115, -1.0078697204589844, -0.832966148853302, -0.6580625772476196, -0.48315900564193726, -0.3082554340362549, -0.1333518624305725, 0.04155170917510986, 0.21645522117614746, 0.3913588523864746, 0.566262423992157, 0.7411659955978394, 0.9160695672035217, 1.090973138809204, 1.2658767700195312, 1.4407802820205688, 1.6156837940216064, 1.7905874252319336, 1.9654910564422607, 2.140394687652588, 2.315298080444336, 2.490201711654663, 2.6651053428649902, 2.8400087356567383, 3.0149123668670654, 3.1898159980773926, 3.3647196292877197, 3.539623260498047, 3.714526653289795, 3.889430284500122, 4.064333915710449, 4.239237308502197, 4.414140701293945, 4.589044570922852, 4.7639479637146, 4.938851833343506, 5.113755226135254, 5.28865909576416, 5.463562488555908, 5.638465881347656, 5.8133697509765625, 5.9882731437683105]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 7.0, 5.0, 2.0, 9.0, 8.0, 12.0, 20.0, 27.0, 23.0, 39.0, 49.0, 57.0, 92.0, 107.0, 140.0, 203.0, 307.0, 440.0, 714.0, 956.0, 1323.0, 1691.0, 2826.0, 1034716.0, 1906.0, 1400.0, 1047.0, 743.0, 482.0, 353.0, 239.0, 167.0, 122.0, 102.0, 58.0, 44.0, 43.0, 27.0, 26.0, 17.0, 23.0, 7.0, 9.0, 8.0, 4.0, 5.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.112381935119629, -5.909613609313965, -5.706845283508301, -5.504076957702637, -5.301308631896973, -5.098540306091309, -4.895771503448486, -4.693003177642822, -4.490234851837158, -4.287466526031494, -4.08469820022583, -3.881929636001587, -3.679161310195923, -3.476392984390259, -3.2736244201660156, -3.0708560943603516, -2.8680877685546875, -2.6653194427490234, -2.4625511169433594, -2.259782552719116, -2.057014226913452, -1.854245901107788, -1.6514774560928345, -1.4487090110778809, -1.2459406852722168, -1.0431723594665527, -0.8404039144515991, -0.6376355290412903, -0.43486714363098145, -0.23209881782531738, -0.02933037281036377, 0.17343807220458984, 0.3762059211730957, 0.5789743065834045, 0.7817426919937134, 0.9845110774040222, 1.187279462814331, 1.3900477886199951, 1.5928162336349487, 1.7955846786499023, 1.9983530044555664, 2.2011213302612305, 2.4038896560668945, 2.6066582202911377, 2.8094265460968018, 3.012194871902466, 3.214963436126709, 3.417731761932373, 3.620500087738037, 3.823268413543701, 4.026036739349365, 4.228805065155029, 4.431573867797852, 4.634342193603516, 4.83711051940918, 5.039878845214844, 5.242647171020508, 5.445415496826172, 5.648183822631836, 5.8509521484375, 6.053720474243164, 6.256488800048828, 6.45925760269165, 6.6620259284973145, 6.8647942543029785]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 10.0, 15.0, 21.0, 51.0, 96.0, 137.0, 312.0, 749.0, 2594.0, 12733.0, 51424808.0, 23009.0, 4648.0, 1268.0, 455.0, 209.0, 103.0, 50.0, 26.0, 17.0, 11.0, 7.0, 3.0, 6.0, 4.0, 0.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-20.0030460357666, -19.40827178955078, -18.81349754333496, -18.21872329711914, -17.62394905090332, -17.0291748046875, -16.43440055847168, -15.839627265930176, -15.244853019714355, -14.650078773498535, -14.055304527282715, -13.460530281066895, -12.86575698852539, -12.27098274230957, -11.67620849609375, -11.08143424987793, -10.48666000366211, -9.891885757446289, -9.297111511230469, -8.702337265014648, -8.107563018798828, -7.512789249420166, -6.918015480041504, -6.323241233825684, -5.728466987609863, -5.133692741394043, -4.538918495178223, -3.9441447257995605, -3.3493704795837402, -2.75459623336792, -2.1598222255706787, -1.5650482177734375, -0.9702720642089844, -0.3754979372024536, 0.21927618980407715, 0.8140503168106079, 1.4088244438171387, 2.003598690032959, 2.5983726978302, 3.1931467056274414, 3.7879209518432617, 4.382695198059082, 4.977469444274902, 5.5722432136535645, 6.167017459869385, 6.761791706085205, 7.356565475463867, 7.9513397216796875, 8.546113967895508, 9.140888214111328, 9.735662460327148, 10.330436706542969, 10.925210952758789, 11.51998519897461, 12.114758491516113, 12.709532737731934, 13.304306983947754, 13.899081230163574, 14.493855476379395, 15.088629722595215, 15.683403015136719, 16.27817726135254, 16.87295150756836, 17.46772575378418, 18.0625]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 7.0, 3.0, 1.0, 3.0, 6.0, 8.0, 11.0, 30.0, 35.0, 39.0, 42.0, 72.0, 150.0, 237.0, 401.0, 665.0, 1323.0, 3118.0, 8415.0, 30780.0, 151851.0, 872771.0, 4738461.0, 388199.0, 69309.0, 16079.0, 4999.0, 2093.0, 987.0, 544.0, 324.0, 156.0, 115.0, 85.0, 34.0, 22.0, 19.0, 14.0, 13.0, 2.0, 3.0, 5.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.39990234375, -0.3875083923339844, -0.37511444091796875, -0.3627204895019531, -0.3503265380859375, -0.3379325866699219, -0.32553863525390625, -0.3131446838378906, -0.300750732421875, -0.2883567810058594, -0.27596282958984375, -0.2635688781738281, -0.2511749267578125, -0.23878097534179688, -0.22638702392578125, -0.21399307250976562, -0.20159912109375, -0.18920516967773438, -0.17681121826171875, -0.16441726684570312, -0.1520233154296875, -0.13962936401367188, -0.12723541259765625, -0.11484146118164062, -0.102447509765625, -0.09005355834960938, -0.07765960693359375, -0.06526565551757812, -0.0528717041015625, -0.040477752685546875, -0.02808380126953125, -0.015689849853515625, -0.0032958984375, 0.009098052978515625, 0.02149200439453125, 0.033885955810546875, 0.0462799072265625, 0.058673858642578125, 0.07106781005859375, 0.08346176147460938, 0.095855712890625, 0.10824966430664062, 0.12064361572265625, 0.13303756713867188, 0.1454315185546875, 0.15782546997070312, 0.17021942138671875, 0.18261337280273438, 0.19500732421875, 0.20740127563476562, 0.21979522705078125, 0.23218917846679688, 0.2445831298828125, 0.2569770812988281, 0.26937103271484375, 0.2817649841308594, 0.294158935546875, 0.3065528869628906, 0.31894683837890625, 0.3313407897949219, 0.3437347412109375, 0.3561286926269531, 0.36852264404296875, 0.3809165954589844, 0.393310546875]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 4.0, 8.0, 8.0, 12.0, 20.0, 17.0, 19.0, 24.0, 29.0, 43.0, 40.0, 39.0, 45.0, 44.0, 61.0, 77.0, 1080.0, 45.0, 45.0, 52.0, 52.0, 48.0, 36.0, 27.0, 21.0, 25.0, 28.0, 25.0, 7.0, 14.0, 12.0, 3.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.828125, -9.46728515625, -9.1064453125, -8.74560546875, -8.384765625, -8.02392578125, -7.6630859375, -7.30224609375, -6.94140625, -6.58056640625, -6.2197265625, -5.85888671875, -5.498046875, -5.13720703125, -4.7763671875, -4.41552734375, -4.0546875, -3.69384765625, -3.3330078125, -2.97216796875, -2.611328125, -2.25048828125, -1.8896484375, -1.52880859375, -1.16796875, -0.80712890625, -0.4462890625, -0.08544921875, 0.275390625, 0.63623046875, 0.9970703125, 1.35791015625, 1.71875, 2.07958984375, 2.4404296875, 2.80126953125, 3.162109375, 3.52294921875, 3.8837890625, 4.24462890625, 4.60546875, 4.96630859375, 5.3271484375, 5.68798828125, 6.048828125, 6.40966796875, 6.7705078125, 7.13134765625, 7.4921875, 7.85302734375, 8.2138671875, 8.57470703125, 8.935546875, 9.29638671875, 9.6572265625, 10.01806640625, 10.37890625, 10.73974609375, 11.1005859375, 11.46142578125, 11.822265625, 12.18310546875, 12.5439453125, 12.90478515625, 13.265625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 3.0, 6.0, 1.0, 1.0, 2.0, 1.0, 8.0, 12.0, 19.0, 14.0, 29.0, 59.0, 120.0, 176.0, 258.0, 512.0, 905.0, 1967.0, 6335.0, 34194.0, 280182.0, 4873824.0, 957666.0, 112277.0, 16057.0, 3769.0, 1378.0, 682.0, 398.0, 193.0, 127.0, 103.0, 45.0, 32.0, 19.0, 24.0, 5.0, 5.0, 5.0, 7.0, 1.0, 1.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.30517578125, -0.29334259033203125, -0.2815093994140625, -0.26967620849609375, -0.257843017578125, -0.24600982666015625, -0.2341766357421875, -0.22234344482421875, -0.21051025390625, -0.19867706298828125, -0.1868438720703125, -0.17501068115234375, -0.163177490234375, -0.15134429931640625, -0.1395111083984375, -0.12767791748046875, -0.1158447265625, -0.10401153564453125, -0.0921783447265625, -0.08034515380859375, -0.068511962890625, -0.05667877197265625, -0.0448455810546875, -0.03301239013671875, -0.02117919921875, -0.00934600830078125, 0.0024871826171875, 0.01432037353515625, 0.026153564453125, 0.03798675537109375, 0.0498199462890625, 0.06165313720703125, 0.073486328125, 0.08531951904296875, 0.0971527099609375, 0.10898590087890625, 0.120819091796875, 0.13265228271484375, 0.1444854736328125, 0.15631866455078125, 0.16815185546875, 0.17998504638671875, 0.1918182373046875, 0.20365142822265625, 0.215484619140625, 0.22731781005859375, 0.2391510009765625, 0.25098419189453125, 0.2628173828125, 0.27465057373046875, 0.2864837646484375, 0.29831695556640625, 0.310150146484375, 0.32198333740234375, 0.3338165283203125, 0.34564971923828125, 0.35748291015625, 0.36931610107421875, 0.3811492919921875, 0.39298248291015625, 0.404815673828125, 0.41664886474609375, 0.4284820556640625, 0.44031524658203125, 0.4521484375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 10.0, 13.0, 14.0, 12.0, 9.0, 24.0, 24.0, 29.0, 28.0, 34.0, 35.0, 37.0, 51.0, 34.0, 45.0, 27.0, 610.0, 489.0, 42.0, 43.0, 41.0, 38.0, 35.0, 36.0, 41.0, 27.0, 26.0, 29.0, 24.0, 22.0, 12.0, 15.0, 6.0, 13.0, 8.0, 5.0, 4.0, 5.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-8.25, -8.01422119140625, -7.7784423828125, -7.54266357421875, -7.306884765625, -7.07110595703125, -6.8353271484375, -6.59954833984375, -6.36376953125, -6.12799072265625, -5.8922119140625, -5.65643310546875, -5.420654296875, -5.18487548828125, -4.9490966796875, -4.71331787109375, -4.4775390625, -4.24176025390625, -4.0059814453125, -3.77020263671875, -3.534423828125, -3.29864501953125, -3.0628662109375, -2.82708740234375, -2.59130859375, -2.35552978515625, -2.1197509765625, -1.88397216796875, -1.648193359375, -1.41241455078125, -1.1766357421875, -0.94085693359375, -0.705078125, -0.46929931640625, -0.2335205078125, 0.00225830078125, 0.238037109375, 0.47381591796875, 0.7095947265625, 0.94537353515625, 1.18115234375, 1.41693115234375, 1.6527099609375, 1.88848876953125, 2.124267578125, 2.36004638671875, 2.5958251953125, 2.83160400390625, 3.0673828125, 3.30316162109375, 3.5389404296875, 3.77471923828125, 4.010498046875, 4.24627685546875, 4.4820556640625, 4.71783447265625, 4.95361328125, 5.18939208984375, 5.4251708984375, 5.66094970703125, 5.896728515625, 6.13250732421875, 6.3682861328125, 6.60406494140625, 6.83984375]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 7.0, 3.0, 2.0, 1.0, 6.0, 8.0, 5.0, 4.0, 6.0, 13.0, 32.0, 42.0, 67.0, 183.0, 400.0, 1054.0, 3202.0, 17198.0, 6162274.0, 98199.0, 5709.0, 1623.0, 677.0, 286.0, 145.0, 84.0, 68.0, 40.0, 36.0, 21.0, 16.0, 6.0, 7.0, 6.0, 4.0, 2.0], "bins": [-1.9306640625, -1.8893356323242188, -1.8480072021484375, -1.8066787719726562, -1.765350341796875, -1.7240219116210938, -1.6826934814453125, -1.6413650512695312, -1.60003662109375, -1.5587081909179688, -1.5173797607421875, -1.4760513305664062, -1.434722900390625, -1.3933944702148438, -1.3520660400390625, -1.3107376098632812, -1.2694091796875, -1.2280807495117188, -1.1867523193359375, -1.1454238891601562, -1.104095458984375, -1.0627670288085938, -1.0214385986328125, -0.9801101684570312, -0.93878173828125, -0.8974533081054688, -0.8561248779296875, -0.8147964477539062, -0.773468017578125, -0.7321395874023438, -0.6908111572265625, -0.6494827270507812, -0.608154296875, -0.5668258666992188, -0.5254974365234375, -0.48416900634765625, -0.442840576171875, -0.40151214599609375, -0.3601837158203125, -0.31885528564453125, -0.27752685546875, -0.23619842529296875, -0.1948699951171875, -0.15354156494140625, -0.112213134765625, -0.07088470458984375, -0.0295562744140625, 0.01177215576171875, 0.0531005859375, 0.09442901611328125, 0.1357574462890625, 0.17708587646484375, 0.218414306640625, 0.25974273681640625, 0.3010711669921875, 0.34239959716796875, 0.38372802734375, 0.42505645751953125, 0.4663848876953125, 0.5077133178710938, 0.549041748046875, 0.5903701782226562, 0.6316986083984375, 0.6730270385742188, 0.71435546875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 7.0, 17.0, 39.0, 57.0, 81.0, 80.0, 125.0, 1163.0, 135.0, 93.0, 83.0, 58.0, 44.0, 25.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.86328125, -7.39080810546875, -6.9183349609375, -6.44586181640625, -5.973388671875, -5.50091552734375, -5.0284423828125, -4.55596923828125, -4.08349609375, -3.61102294921875, -3.1385498046875, -2.66607666015625, -2.193603515625, -1.72113037109375, -1.2486572265625, -0.77618408203125, -0.3037109375, 0.16876220703125, 0.6412353515625, 1.11370849609375, 1.586181640625, 2.05865478515625, 2.5311279296875, 3.00360107421875, 3.47607421875, 3.94854736328125, 4.4210205078125, 4.89349365234375, 5.365966796875, 5.83843994140625, 6.3109130859375, 6.78338623046875, 7.255859375, 7.72833251953125, 8.2008056640625, 8.67327880859375, 9.145751953125, 9.61822509765625, 10.0906982421875, 10.56317138671875, 11.03564453125, 11.50811767578125, 11.9805908203125, 12.45306396484375, 12.925537109375, 13.39801025390625, 13.8704833984375, 14.34295654296875, 14.8154296875, 15.28790283203125, 15.7603759765625, 16.23284912109375, 16.705322265625, 17.17779541015625, 17.6502685546875, 18.12274169921875, 18.59521484375, 19.06768798828125, 19.5401611328125, 20.01263427734375, 20.485107421875, 20.95758056640625, 21.4300537109375, 21.90252685546875, 22.375]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 13.0, 672.0, 307.0, 13.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.86222839355469, -50.89992141723633, -49.937618255615234, -48.975311279296875, -48.013004302978516, -47.050697326660156, -46.08839416503906, -45.1260871887207, -44.163780212402344, -43.201473236083984, -42.23917007446289, -41.27686309814453, -40.31455612182617, -39.35224914550781, -38.38994598388672, -37.42763900756836, -36.465335845947266, -35.503028869628906, -34.54072570800781, -33.57841873168945, -32.616111755371094, -31.653806686401367, -30.69150161743164, -29.72919464111328, -28.766887664794922, -27.804582595825195, -26.842275619506836, -25.87997055053711, -24.91766357421875, -23.955358505249023, -22.993053436279297, -22.030746459960938, -21.068439483642578, -20.10613441467285, -19.143827438354492, -18.181522369384766, -17.219215393066406, -16.25691032409668, -15.294604301452637, -14.332298278808594, -13.369993209838867, -12.407687187194824, -11.445381164550781, -10.483076095581055, -9.520770072937012, -8.558464050292969, -7.596158027648926, -6.633852481842041, -5.671546936035156, -4.709240913391113, -3.7469353675842285, -2.7846293449401855, -1.8223235607147217, -0.8600177764892578, 0.10228824615478516, 1.06459379196167, 2.026899814605713, 2.9892055988311768, 3.9515113830566406, 4.913817405700684, 5.876123428344727, 6.838428974151611, 7.800734996795654, 8.763040542602539, 9.725346565246582]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 6.0, 14.0, 27.0, 65.0, 83.0, 117.0, 144.0, 152.0, 145.0, 105.0, 75.0, 31.0, 21.0, 11.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-31.46249771118164, -30.51834487915039, -29.57419204711914, -28.630041122436523, -27.685888290405273, -26.741735458374023, -25.797584533691406, -24.853431701660156, -23.909278869628906, -22.965126037597656, -22.020973205566406, -21.07682228088379, -20.13266944885254, -19.18851661682129, -18.244365692138672, -17.300212860107422, -16.356060028076172, -15.411907196044922, -14.467755317687988, -13.523603439331055, -12.579450607299805, -11.635297775268555, -10.691145896911621, -9.746994018554688, -8.802841186523438, -7.858688831329346, -6.914536476135254, -5.970384120941162, -5.02623176574707, -4.0820794105529785, -3.1379270553588867, -2.193774700164795, -1.249624252319336, -0.30547189712524414, 0.6386804580688477, 1.5828328132629395, 2.5269851684570312, 3.471137523651123, 4.415289878845215, 5.359442234039307, 6.303594589233398, 7.24774694442749, 8.191899299621582, 9.136051177978516, 10.080204010009766, 11.024356842041016, 11.96850872039795, 12.912660598754883, 13.856813430786133, 14.800966262817383, 15.745118141174316, 16.68927001953125, 17.6334228515625, 18.57757568359375, 19.521728515625, 20.465879440307617, 21.410032272338867, 22.354185104370117, 23.298336029052734, 24.242488861083984, 25.186641693115234, 26.130794525146484, 27.074947357177734, 28.01909828186035, 28.9632511138916]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 7.0, 9.0, 15.0, 30.0, 68.0, 5306.0, 3721.0, 12511.0, 4113097.0, 52116.0, 6381.0, 849.0, 73.0, 42.0, 16.0, 15.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0312042236328125, -0.03007340431213379, -0.028942584991455078, -0.027811765670776367, -0.026680946350097656, -0.025550127029418945, -0.024419307708740234, -0.023288488388061523, -0.022157669067382812, -0.0210268497467041, -0.01989603042602539, -0.01876521110534668, -0.01763439178466797, -0.016503572463989258, -0.015372753143310547, -0.014241933822631836, -0.013111114501953125, -0.011980295181274414, -0.010849475860595703, -0.009718656539916992, -0.008587837219238281, -0.00745701789855957, -0.006326198577880859, -0.0051953792572021484, -0.0040645599365234375, -0.0029337406158447266, -0.0018029212951660156, -0.0006721019744873047, 0.00045871734619140625, 0.0015895366668701172, 0.002720355987548828, 0.003851175308227539, 0.00498199462890625, 0.006112813949584961, 0.007243633270263672, 0.008374452590942383, 0.009505271911621094, 0.010636091232299805, 0.011766910552978516, 0.012897729873657227, 0.014028549194335938, 0.015159368515014648, 0.01629018783569336, 0.01742100715637207, 0.01855182647705078, 0.019682645797729492, 0.020813465118408203, 0.021944284439086914, 0.023075103759765625, 0.024205923080444336, 0.025336742401123047, 0.026467561721801758, 0.02759838104248047, 0.02872920036315918, 0.02986001968383789, 0.0309908390045166, 0.03212165832519531, 0.03325247764587402, 0.034383296966552734, 0.035514116287231445, 0.036644935607910156, 0.03777575492858887, 0.03890657424926758, 0.04003739356994629, 0.041168212890625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 12.0, 14.0, 29.0, 92.0, 242.0, 409.0, 106.0, 45.0, 23.0, 10.0, 11.0, 3.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0162811279296875, -0.015659809112548828, -0.015038490295410156, -0.014417171478271484, -0.013795852661132812, -0.01317453384399414, -0.012553215026855469, -0.011931896209716797, -0.011310577392578125, -0.010689258575439453, -0.010067939758300781, -0.00944662094116211, -0.008825302124023438, -0.008203983306884766, -0.007582664489746094, -0.006961345672607422, -0.00634002685546875, -0.005718708038330078, -0.005097389221191406, -0.004476070404052734, -0.0038547515869140625, -0.0032334327697753906, -0.0026121139526367188, -0.001990795135498047, -0.001369476318359375, -0.0007481575012207031, -0.00012683868408203125, 0.0004944801330566406, 0.0011157989501953125, 0.0017371177673339844, 0.0023584365844726562, 0.002979755401611328, 0.00360107421875, 0.004222393035888672, 0.004843711853027344, 0.005465030670166016, 0.0060863494873046875, 0.006707668304443359, 0.007328987121582031, 0.007950305938720703, 0.008571624755859375, 0.009192943572998047, 0.009814262390136719, 0.01043558120727539, 0.011056900024414062, 0.011678218841552734, 0.012299537658691406, 0.012920856475830078, 0.01354217529296875, 0.014163494110107422, 0.014784812927246094, 0.015406131744384766, 0.016027450561523438, 0.01664876937866211, 0.01727008819580078, 0.017891407012939453, 0.018512725830078125, 0.019134044647216797, 0.01975536346435547, 0.02037668228149414, 0.020998001098632812, 0.021619319915771484, 0.022240638732910156, 0.022861957550048828, 0.0234832763671875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 3.0, 2.0, 6.0, 8.0, 21.0, 10.0, 25.0, 28.0, 38.0, 48.0, 92.0, 176.0, 405.0, 1525.0, 4181691.0, 9140.0, 524.0, 218.0, 109.0, 71.0, 35.0, 29.0, 19.0, 10.0, 6.0, 5.0, 8.0, 6.0, 2.0, 1.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033721923828125, -0.03272056579589844, -0.031719207763671875, -0.030717849731445312, -0.02971649169921875, -0.028715133666992188, -0.027713775634765625, -0.026712417602539062, -0.0257110595703125, -0.024709701538085938, -0.023708343505859375, -0.022706985473632812, -0.02170562744140625, -0.020704269409179688, -0.019702911376953125, -0.018701553344726562, -0.0177001953125, -0.016698837280273438, -0.015697479248046875, -0.014696121215820312, -0.01369476318359375, -0.012693405151367188, -0.011692047119140625, -0.010690689086914062, -0.0096893310546875, -0.008687973022460938, -0.007686614990234375, -0.0066852569580078125, -0.00568389892578125, -0.0046825408935546875, -0.003681182861328125, -0.0026798248291015625, -0.001678466796875, -0.0006771087646484375, 0.000324249267578125, 0.0013256072998046875, 0.00232696533203125, 0.0033283233642578125, 0.004329681396484375, 0.0053310394287109375, 0.0063323974609375, 0.0073337554931640625, 0.008335113525390625, 0.009336471557617188, 0.01033782958984375, 0.011339187622070312, 0.012340545654296875, 0.013341903686523438, 0.01434326171875, 0.015344619750976562, 0.016345977783203125, 0.017347335815429688, 0.01834869384765625, 0.019350051879882812, 0.020351409912109375, 0.021352767944335938, 0.0223541259765625, 0.023355484008789062, 0.024356842041015625, 0.025358200073242188, 0.02635955810546875, 0.027360916137695312, 0.028362274169921875, 0.029363632202148438, 0.030364990234375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 5.0, 4.0, 2.0, 4.0, 8.0, 16.0, 12.0, 21.0, 29.0, 32.0, 48.0, 62.0, 137.0, 269.0, 513.0, 925.0, 900.0, 502.0, 234.0, 120.0, 74.0, 45.0, 33.0, 20.0, 12.0, 7.0, 5.0, 8.0, 7.0, 4.0, 3.0, 2.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007175445556640625, -0.006964385509490967, -0.006753325462341309, -0.00654226541519165, -0.006331205368041992, -0.006120145320892334, -0.005909085273742676, -0.005698025226593018, -0.005486965179443359, -0.005275905132293701, -0.005064845085144043, -0.004853785037994385, -0.0046427249908447266, -0.004431664943695068, -0.00422060489654541, -0.004009544849395752, -0.0037984848022460938, -0.0035874247550964355, -0.0033763647079467773, -0.003165304660797119, -0.002954244613647461, -0.0027431845664978027, -0.0025321245193481445, -0.0023210644721984863, -0.002110004425048828, -0.00189894437789917, -0.0016878843307495117, -0.0014768242835998535, -0.0012657642364501953, -0.0010547041893005371, -0.0008436441421508789, -0.0006325840950012207, -0.0004215240478515625, -0.0002104640007019043, 5.960464477539062e-07, 0.0002116560935974121, 0.0004227161407470703, 0.0006337761878967285, 0.0008448362350463867, 0.001055896282196045, 0.0012669563293457031, 0.0014780163764953613, 0.0016890764236450195, 0.0019001364707946777, 0.002111196517944336, 0.002322256565093994, 0.0025333166122436523, 0.0027443766593933105, 0.0029554367065429688, 0.003166496753692627, 0.003377556800842285, 0.0035886168479919434, 0.0037996768951416016, 0.00401073694229126, 0.004221796989440918, 0.004432857036590576, 0.004643917083740234, 0.004854977130889893, 0.005066037178039551, 0.005277097225189209, 0.005488157272338867, 0.005699217319488525, 0.005910277366638184, 0.006121337413787842, 0.0063323974609375]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 58.0, 756.0, 186.0, 13.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016395432874560356, -0.01527087390422821, -0.014146314933896065, -0.013021755032241344, -0.011897196061909199, -0.010772637091577053, -0.009648077189922333, -0.008523518219590187, -0.007398959249258041, -0.006274400278925896, -0.005149840842932463, -0.00402528140693903, -0.002900722436606884, -0.0017761634662747383, -0.0006516040302813053, 0.0004729554057121277, 0.0015975143760442734, 0.0027220735792070627, 0.003846632782369852, 0.004971192218363285, 0.006095751188695431, 0.0072203101590275764, 0.008344870060682297, 0.009469429031014442, 0.010593988001346588, 0.011718546971678734, 0.01284310594201088, 0.0139676658436656, 0.015092224813997746, 0.016216784715652466, 0.01734134368598461, 0.018465902656316757, 0.019590459764003754, 0.0207150187343359, 0.021839577704668045, 0.02296413667500019, 0.024088695645332336, 0.02521325647830963, 0.026337815448641777, 0.027462374418973923, 0.02858693338930607, 0.029711492359638214, 0.03083605132997036, 0.031960610300302505, 0.0330851711332798, 0.0342097282409668, 0.03533428907394409, 0.03645884990692139, 0.03758340701460838, 0.03870796784758568, 0.039832524955272675, 0.04095708578824997, 0.042081642895936966, 0.04320620372891426, 0.04433076083660126, 0.04545532166957855, 0.04657988250255585, 0.04770444333553314, 0.04882900044322014, 0.049953561276197433, 0.05107811838388443, 0.052202679216861725, 0.05332723632454872, 0.054451797157526016, 0.05557635426521301]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 2.0, 4.0, 7.0, 9.0, 12.0, 14.0, 16.0, 16.0, 26.0, 24.0, 33.0, 24.0, 37.0, 30.0, 33.0, 40.0, 47.0, 49.0, 49.0, 27.0, 73.0, 58.0, 48.0, 44.0, 41.0, 44.0, 27.0, 28.0, 28.0, 21.0, 13.0, 14.0, 20.0, 10.0, 7.0, 7.0, 4.0, 3.0, 2.0, 6.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.016760945320129395, -0.016301672905683517, -0.01584239862859249, -0.01538312528282404, -0.014923851937055588, -0.014464578591287136, -0.014005305245518684, -0.013546031899750233, -0.013086758553981781, -0.01262748520821333, -0.012168211862444878, -0.011708938516676426, -0.011249665170907974, -0.010790391825139523, -0.01033111847937107, -0.00987184513360262, -0.009412571787834167, -0.008953298442065716, -0.008494025096297264, -0.008034751750528812, -0.007575478404760361, -0.007116205058991909, -0.006656931713223457, -0.006197658367455006, -0.005738385021686554, -0.005279111675918102, -0.004819838330149651, -0.004360564984381199, -0.003901291638612747, -0.0034420182928442955, -0.002982744947075844, -0.002523471601307392, -0.0020641982555389404, -0.0016049249097704887, -0.001145651564002037, -0.0006863782182335854, -0.00022710487246513367, 0.00023216847330331802, 0.0006914418190717697, 0.0011507151648402214, 0.001609988510608673, 0.002069261856377125, 0.0025285352021455765, 0.002987808547914028, 0.00344708189368248, 0.0039063552394509315, 0.004365628585219383, 0.004824901930987835, 0.005284175276756287, 0.005743448622524738, 0.00620272196829319, 0.006661995314061642, 0.007121268659830093, 0.007580542005598545, 0.008039815351366997, 0.008499088697135448, 0.0089583620429039, 0.009417635388672352, 0.009876908734440804, 0.010336182080209255, 0.010795455425977707, 0.011254728771746159, 0.01171400211751461, 0.012173275463283062, 0.012632548809051514]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 8.0, 11.0, 10.0, 10.0, 11.0, 8.0, 21.0, 36.0, 25.0, 39.0, 46.0, 75.0, 75.0, 130.0, 206.0, 356.0, 674.0, 1903.0, 10407.0, 956799.0, 70603.0, 4468.0, 1176.0, 558.0, 296.0, 180.0, 132.0, 67.0, 77.0, 35.0, 19.0, 16.0, 12.0, 14.0, 7.0, 4.0, 8.0, 8.0, 2.0, 0.0, 2.0, 3.0, 9.0, 4.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.88818359375, -0.8550338745117188, -0.8218841552734375, -0.7887344360351562, -0.755584716796875, -0.7224349975585938, -0.6892852783203125, -0.6561355590820312, -0.62298583984375, -0.5898361206054688, -0.5566864013671875, -0.5235366821289062, -0.490386962890625, -0.45723724365234375, -0.4240875244140625, -0.39093780517578125, -0.3577880859375, -0.32463836669921875, -0.2914886474609375, -0.25833892822265625, -0.225189208984375, -0.19203948974609375, -0.1588897705078125, -0.12574005126953125, -0.09259033203125, -0.05944061279296875, -0.0262908935546875, 0.00685882568359375, 0.040008544921875, 0.07315826416015625, 0.1063079833984375, 0.13945770263671875, 0.172607421875, 0.20575714111328125, 0.2389068603515625, 0.27205657958984375, 0.305206298828125, 0.33835601806640625, 0.3715057373046875, 0.40465545654296875, 0.43780517578125, 0.47095489501953125, 0.5041046142578125, 0.5372543334960938, 0.570404052734375, 0.6035537719726562, 0.6367034912109375, 0.6698532104492188, 0.7030029296875, 0.7361526489257812, 0.7693023681640625, 0.8024520874023438, 0.835601806640625, 0.8687515258789062, 0.9019012451171875, 0.9350509643554688, 0.96820068359375, 1.0013504028320312, 1.0345001220703125, 1.0676498413085938, 1.100799560546875, 1.1339492797851562, 1.1670989990234375, 1.2002487182617188, 1.2333984375]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 12.0, 12.0, 25.0, 72.0, 214.0, 410.0, 143.0, 58.0, 25.0, 9.0, 14.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.01611328125, -0.015502691268920898, -0.014892101287841797, -0.014281511306762695, -0.013670921325683594, -0.013060331344604492, -0.01244974136352539, -0.011839151382446289, -0.011228561401367188, -0.010617971420288086, -0.010007381439208984, -0.009396791458129883, -0.008786201477050781, -0.00817561149597168, -0.007565021514892578, -0.0069544315338134766, -0.006343841552734375, -0.0057332515716552734, -0.005122661590576172, -0.00451207160949707, -0.0039014816284179688, -0.003290891647338867, -0.0026803016662597656, -0.002069711685180664, -0.0014591217041015625, -0.0008485317230224609, -0.00023794174194335938, 0.0003726482391357422, 0.0009832382202148438, 0.0015938282012939453, 0.002204418182373047, 0.0028150081634521484, 0.00342559814453125, 0.0040361881256103516, 0.004646778106689453, 0.005257368087768555, 0.005867958068847656, 0.006478548049926758, 0.007089138031005859, 0.007699728012084961, 0.008310317993164062, 0.008920907974243164, 0.009531497955322266, 0.010142087936401367, 0.010752677917480469, 0.01136326789855957, 0.011973857879638672, 0.012584447860717773, 0.013195037841796875, 0.013805627822875977, 0.014416217803955078, 0.01502680778503418, 0.01563739776611328, 0.016247987747192383, 0.016858577728271484, 0.017469167709350586, 0.018079757690429688, 0.01869034767150879, 0.01930093765258789, 0.019911527633666992, 0.020522117614746094, 0.021132707595825195, 0.021743297576904297, 0.0223538875579834, 0.0229644775390625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 9.0, 2.0, 4.0, 9.0, 14.0, 18.0, 24.0, 33.0, 60.0, 88.0, 116.0, 181.0, 268.0, 440.0, 634.0, 996.0, 1512.0, 2510.0, 3882.0, 6336.0, 10179.0, 16757.0, 30673.0, 60794.0, 144917.0, 434088.0, 180159.0, 70329.0, 34581.0, 19091.0, 11203.0, 6798.0, 4311.0, 2732.0, 1703.0, 1106.0, 674.0, 421.0, 291.0, 209.0, 127.0, 80.0, 60.0, 45.0, 32.0, 17.0, 6.0, 15.0, 9.0, 4.0, 3.0, 5.0, 2.0, 3.0, 1.0, 2.0], "bins": [-0.0223388671875, -0.021673917770385742, -0.021008968353271484, -0.020344018936157227, -0.01967906951904297, -0.01901412010192871, -0.018349170684814453, -0.017684221267700195, -0.017019271850585938, -0.01635432243347168, -0.015689373016357422, -0.015024423599243164, -0.014359474182128906, -0.013694524765014648, -0.01302957534790039, -0.012364625930786133, -0.011699676513671875, -0.011034727096557617, -0.01036977767944336, -0.009704828262329102, -0.009039878845214844, -0.008374929428100586, -0.007709980010986328, -0.00704503059387207, -0.0063800811767578125, -0.005715131759643555, -0.005050182342529297, -0.004385232925415039, -0.0037202835083007812, -0.0030553340911865234, -0.0023903846740722656, -0.0017254352569580078, -0.00106048583984375, -0.0003955364227294922, 0.0002694129943847656, 0.0009343624114990234, 0.0015993118286132812, 0.002264261245727539, 0.002929210662841797, 0.0035941600799560547, 0.0042591094970703125, 0.00492405891418457, 0.005589008331298828, 0.006253957748413086, 0.006918907165527344, 0.0075838565826416016, 0.00824880599975586, 0.008913755416870117, 0.009578704833984375, 0.010243654251098633, 0.01090860366821289, 0.011573553085327148, 0.012238502502441406, 0.012903451919555664, 0.013568401336669922, 0.01423335075378418, 0.014898300170898438, 0.015563249588012695, 0.016228199005126953, 0.01689314842224121, 0.01755809783935547, 0.018223047256469727, 0.018887996673583984, 0.019552946090698242, 0.0202178955078125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 6.0, 7.0, 3.0, 4.0, 5.0, 13.0, 9.0, 10.0, 17.0, 10.0, 23.0, 9.0, 15.0, 11.0, 21.0, 35.0, 44.0, 32.0, 29.0, 38.0, 39.0, 34.0, 37.0, 29.0, 40.0, 42.0, 38.0, 33.0, 30.0, 43.0, 26.0, 33.0, 20.0, 38.0, 23.0, 14.0, 22.0, 19.0, 16.0, 11.0, 11.0, 9.0, 10.0, 7.0, 13.0, 5.0, 3.0, 4.0, 2.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01287841796875, -0.012460589408874512, -0.012042760848999023, -0.011624932289123535, -0.011207103729248047, -0.010789275169372559, -0.01037144660949707, -0.009953618049621582, -0.009535789489746094, -0.009117960929870605, -0.008700132369995117, -0.008282303810119629, -0.00786447525024414, -0.007446646690368652, -0.007028818130493164, -0.006610989570617676, -0.0061931610107421875, -0.005775332450866699, -0.005357503890991211, -0.004939675331115723, -0.004521846771240234, -0.004104018211364746, -0.003686189651489258, -0.0032683610916137695, -0.0028505325317382812, -0.002432703971862793, -0.0020148754119873047, -0.0015970468521118164, -0.0011792182922363281, -0.0007613897323608398, -0.00034356117248535156, 7.426738739013672e-05, 0.000492095947265625, 0.0009099245071411133, 0.0013277530670166016, 0.0017455816268920898, 0.002163410186767578, 0.0025812387466430664, 0.0029990673065185547, 0.003416895866394043, 0.0038347244262695312, 0.0042525529861450195, 0.004670381546020508, 0.005088210105895996, 0.005506038665771484, 0.005923867225646973, 0.006341695785522461, 0.006759524345397949, 0.0071773529052734375, 0.007595181465148926, 0.008013010025024414, 0.008430838584899902, 0.00884866714477539, 0.009266495704650879, 0.009684324264526367, 0.010102152824401855, 0.010519981384277344, 0.010937809944152832, 0.01135563850402832, 0.011773467063903809, 0.012191295623779297, 0.012609124183654785, 0.013026952743530273, 0.013444781303405762, 0.01386260986328125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 2.0, 2.0, 8.0, 5.0, 14.0, 9.0, 30.0, 38.0, 78.0, 175.0, 266.0, 710.0, 1957.0, 6265.0, 30284.0, 636974.0, 339980.0, 23584.0, 5311.0, 1656.0, 640.0, 290.0, 127.0, 59.0, 34.0, 25.0, 10.0, 9.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0146026611328125, -0.014097929000854492, -0.013593196868896484, -0.013088464736938477, -0.012583732604980469, -0.012079000473022461, -0.011574268341064453, -0.011069536209106445, -0.010564804077148438, -0.01006007194519043, -0.009555339813232422, -0.009050607681274414, -0.008545875549316406, -0.008041143417358398, -0.007536411285400391, -0.007031679153442383, -0.006526947021484375, -0.006022214889526367, -0.005517482757568359, -0.0050127506256103516, -0.004508018493652344, -0.004003286361694336, -0.003498554229736328, -0.0029938220977783203, -0.0024890899658203125, -0.0019843578338623047, -0.0014796257019042969, -0.0009748935699462891, -0.00047016143798828125, 3.457069396972656e-05, 0.0005393028259277344, 0.0010440349578857422, 0.00154876708984375, 0.002053499221801758, 0.0025582313537597656, 0.0030629634857177734, 0.0035676956176757812, 0.004072427749633789, 0.004577159881591797, 0.005081892013549805, 0.0055866241455078125, 0.00609135627746582, 0.006596088409423828, 0.007100820541381836, 0.007605552673339844, 0.008110284805297852, 0.00861501693725586, 0.009119749069213867, 0.009624481201171875, 0.010129213333129883, 0.01063394546508789, 0.011138677597045898, 0.011643409729003906, 0.012148141860961914, 0.012652873992919922, 0.01315760612487793, 0.013662338256835938, 0.014167070388793945, 0.014671802520751953, 0.015176534652709961, 0.01568126678466797, 0.016185998916625977, 0.016690731048583984, 0.017195463180541992, 0.0177001953125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 1.0, 4.0, 7.0, 5.0, 6.0, 13.0, 18.0, 24.0, 20.0, 25.0, 53.0, 82.0, 197.0, 257.0, 114.0, 61.0, 24.0, 27.0, 22.0, 8.0, 12.0, 5.0, 5.0, 2.0, 0.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011116266250610352, -0.00010690558701753616, -0.00010264851152896881, -9.839143604040146e-05, -9.41343605518341e-05, -8.987728506326675e-05, -8.56202095746994e-05, -8.136313408613205e-05, -7.71060585975647e-05, -7.284898310899734e-05, -6.859190762042999e-05, -6.433483213186264e-05, -6.007775664329529e-05, -5.5820681154727936e-05, -5.1563605666160583e-05, -4.730653017759323e-05, -4.304945468902588e-05, -3.8792379200458527e-05, -3.4535303711891174e-05, -3.0278228223323822e-05, -2.602115273475647e-05, -2.1764077246189117e-05, -1.7507001757621765e-05, -1.3249926269054413e-05, -8.99285078048706e-06, -4.735775291919708e-06, -4.78699803352356e-07, 3.7783756852149963e-06, 8.035451173782349e-06, 1.2292526662349701e-05, 1.6549602150917053e-05, 2.0806677639484406e-05, 2.5063753128051758e-05, 2.932082861661911e-05, 3.357790410518646e-05, 3.7834979593753815e-05, 4.209205508232117e-05, 4.634913057088852e-05, 5.060620605945587e-05, 5.4863281548023224e-05, 5.9120357036590576e-05, 6.337743252515793e-05, 6.763450801372528e-05, 7.189158350229263e-05, 7.614865899085999e-05, 8.040573447942734e-05, 8.466280996799469e-05, 8.891988545656204e-05, 9.31769609451294e-05, 9.743403643369675e-05, 0.0001016911119222641, 0.00010594818741083145, 0.0001102052628993988, 0.00011446233838796616, 0.00011871941387653351, 0.00012297648936510086, 0.0001272335648536682, 0.00013149064034223557, 0.00013574771583080292, 0.00014000479131937027, 0.00014426186680793762, 0.00014851894229650497, 0.00015277601778507233, 0.00015703309327363968, 0.00016129016876220703]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 7.0, 1.0, 5.0, 6.0, 6.0, 4.0, 9.0, 21.0, 20.0, 43.0, 78.0, 163.0, 393.0, 1652.0, 17862.0, 1000452.0, 24913.0, 2101.0, 441.0, 168.0, 72.0, 41.0, 29.0, 14.0, 11.0, 14.0, 10.0, 9.0, 7.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046966552734375, -0.045523643493652344, -0.04408073425292969, -0.04263782501220703, -0.041194915771484375, -0.03975200653076172, -0.03830909729003906, -0.036866188049316406, -0.03542327880859375, -0.033980369567871094, -0.03253746032714844, -0.03109455108642578, -0.029651641845703125, -0.02820873260498047, -0.026765823364257812, -0.025322914123535156, -0.0238800048828125, -0.022437095642089844, -0.020994186401367188, -0.01955127716064453, -0.018108367919921875, -0.01666545867919922, -0.015222549438476562, -0.013779640197753906, -0.01233673095703125, -0.010893821716308594, -0.009450912475585938, -0.008008003234863281, -0.006565093994140625, -0.005122184753417969, -0.0036792755126953125, -0.0022363662719726562, -0.00079345703125, 0.0006494522094726562, 0.0020923614501953125, 0.0035352706909179688, 0.004978179931640625, 0.006421089172363281, 0.007863998413085938, 0.009306907653808594, 0.01074981689453125, 0.012192726135253906, 0.013635635375976562, 0.015078544616699219, 0.016521453857421875, 0.01796436309814453, 0.019407272338867188, 0.020850181579589844, 0.0222930908203125, 0.023736000061035156, 0.025178909301757812, 0.02662181854248047, 0.028064727783203125, 0.02950763702392578, 0.030950546264648438, 0.032393455505371094, 0.03383636474609375, 0.035279273986816406, 0.03672218322753906, 0.03816509246826172, 0.039608001708984375, 0.04105091094970703, 0.04249382019042969, 0.043936729431152344, 0.045379638671875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 0.0, 5.0, 9.0, 5.0, 6.0, 10.0, 10.0, 14.0, 15.0, 34.0, 50.0, 60.0, 132.0, 225.0, 178.0, 76.0, 43.0, 30.0, 32.0, 11.0, 14.0, 8.0, 10.0, 5.0, 4.0, 6.0, 2.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00982666015625, -0.009516716003417969, -0.009206771850585938, -0.008896827697753906, -0.008586883544921875, -0.008276939392089844, -0.007966995239257812, -0.007657051086425781, -0.00734710693359375, -0.007037162780761719, -0.0067272186279296875, -0.006417274475097656, -0.006107330322265625, -0.005797386169433594, -0.0054874420166015625, -0.005177497863769531, -0.0048675537109375, -0.004557609558105469, -0.0042476654052734375, -0.003937721252441406, -0.003627777099609375, -0.0033178329467773438, -0.0030078887939453125, -0.0026979446411132812, -0.00238800048828125, -0.0020780563354492188, -0.0017681121826171875, -0.0014581680297851562, -0.001148223876953125, -0.0008382797241210938, -0.0005283355712890625, -0.00021839141845703125, 9.1552734375e-05, 0.00040149688720703125, 0.0007114410400390625, 0.0010213851928710938, 0.001331329345703125, 0.0016412734985351562, 0.0019512176513671875, 0.0022611618041992188, 0.00257110595703125, 0.0028810501098632812, 0.0031909942626953125, 0.0035009384155273438, 0.003810882568359375, 0.004120826721191406, 0.0044307708740234375, 0.004740715026855469, 0.0050506591796875, 0.005360603332519531, 0.0056705474853515625, 0.005980491638183594, 0.006290435791015625, 0.006600379943847656, 0.0069103240966796875, 0.007220268249511719, 0.00753021240234375, 0.007840156555175781, 0.008150100708007812, 0.008460044860839844, 0.008769989013671875, 0.009079933166503906, 0.009389877319335938, 0.009699821472167969, 0.010009765625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 11.0, 93.0, 613.0, 228.0, 49.0, 10.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9773010611534119, -0.9563300609588623, -0.9353590607643127, -0.9143880605697632, -0.8934170007705688, -0.8724460005760193, -0.8514750003814697, -0.8305040001869202, -0.8095329999923706, -0.788561999797821, -0.7675909996032715, -0.7466199398040771, -0.7256489396095276, -0.704677939414978, -0.6837069392204285, -0.6627359390258789, -0.6417648792266846, -0.620793879032135, -0.5998228788375854, -0.5788518190383911, -0.5578808188438416, -0.536909818649292, -0.5159388184547424, -0.49496781826019287, -0.4739967882633209, -0.45302578806877136, -0.4320547580718994, -0.41108375787734985, -0.3901127576828003, -0.36914172768592834, -0.3481707274913788, -0.32719969749450684, -0.3062286972999573, -0.2852576971054077, -0.26428666710853577, -0.2433156669139862, -0.22234465181827545, -0.2013736367225647, -0.18040263652801514, -0.15943162143230438, -0.13846060633659363, -0.11748959124088287, -0.09651858359575272, -0.07554757595062256, -0.054576560854911804, -0.03360554575920105, -0.01263454556465149, 0.008336469531059265, 0.02930748462677002, 0.050278495997190475, 0.07124950736761093, 0.09222051501274109, 0.11319153010845184, 0.1341625452041626, 0.15513354539871216, 0.1761045604944229, 0.19707557559013367, 0.21804659068584442, 0.23901760578155518, 0.25998860597610474, 0.2809596061706543, 0.30193063616752625, 0.3229016363620758, 0.34387266635894775, 0.3648436665534973]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 6.0, 10.0, 12.0, 14.0, 16.0, 16.0, 20.0, 25.0, 28.0, 38.0, 56.0, 37.0, 51.0, 56.0, 69.0, 81.0, 60.0, 61.0, 44.0, 46.0, 58.0, 38.0, 36.0, 35.0, 17.0, 23.0, 17.0, 9.0, 8.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11985033750534058, -0.11644826084375381, -0.11304618418216705, -0.10964410752058029, -0.10624203085899353, -0.10283994674682617, -0.09943787008523941, -0.09603579342365265, -0.09263371676206589, -0.08923164010047913, -0.08582956343889236, -0.0824274867773056, -0.07902540266513824, -0.07562333345413208, -0.07222124934196472, -0.06881917268037796, -0.0654170960187912, -0.06201501935720444, -0.058612942695617676, -0.055210862308740616, -0.051808785647153854, -0.04840670898556709, -0.04500462859869003, -0.04160255193710327, -0.03820047527551651, -0.03479839861392975, -0.03139632195234299, -0.027994241565465927, -0.024592164903879166, -0.021190088242292404, -0.017788009718060493, -0.014385931193828583, -0.010983854532241821, -0.007581776939332485, -0.004179699346423149, -0.000777621753513813, 0.002624455839395523, 0.0060265325009822845, 0.009428611025214195, 0.012830689549446106, 0.016232766211032867, 0.01963484287261963, 0.02303692139685154, 0.02643899992108345, 0.029841076582670212, 0.03324315324425697, 0.03664523363113403, 0.040047310292720795, 0.043449386954307556, 0.04685146361589432, 0.05025354027748108, 0.05365562066435814, 0.0570576973259449, 0.06045977398753166, 0.06386185437440872, 0.06726393103599548, 0.07066600769758224, 0.074068084359169, 0.07747016102075577, 0.08087223768234253, 0.08427432179450989, 0.08767639100551605, 0.09107847511768341, 0.09448055177927017, 0.09788262844085693]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 4.0, 10.0, 9.0, 7.0, 13.0, 19.0, 29.0, 31.0, 40.0, 59.0, 79.0, 100.0, 166.0, 270.0, 672.0, 3148.0, 50067.0, 4128339.0, 8895.0, 1291.0, 337.0, 184.0, 99.0, 91.0, 74.0, 55.0, 39.0, 41.0, 24.0, 19.0, 17.0, 19.0, 9.0, 12.0, 8.0, 3.0, 4.0, 2.0, 1.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.145263671875, -0.1401195526123047, -0.13497543334960938, -0.12983131408691406, -0.12468719482421875, -0.11954307556152344, -0.11439895629882812, -0.10925483703613281, -0.1041107177734375, -0.09896659851074219, -0.09382247924804688, -0.08867835998535156, -0.08353424072265625, -0.07839012145996094, -0.07324600219726562, -0.06810188293457031, -0.062957763671875, -0.05781364440917969, -0.052669525146484375, -0.04752540588378906, -0.04238128662109375, -0.03723716735839844, -0.032093048095703125, -0.026948928833007812, -0.0218048095703125, -0.016660690307617188, -0.011516571044921875, -0.0063724517822265625, -0.00122833251953125, 0.0039157867431640625, 0.009059906005859375, 0.014204025268554688, 0.01934814453125, 0.024492263793945312, 0.029636383056640625, 0.03478050231933594, 0.03992462158203125, 0.04506874084472656, 0.050212860107421875, 0.05535697937011719, 0.0605010986328125, 0.06564521789550781, 0.07078933715820312, 0.07593345642089844, 0.08107757568359375, 0.08622169494628906, 0.09136581420898438, 0.09650993347167969, 0.101654052734375, 0.10679817199707031, 0.11194229125976562, 0.11708641052246094, 0.12223052978515625, 0.12737464904785156, 0.13251876831054688, 0.1376628875732422, 0.1428070068359375, 0.1479511260986328, 0.15309524536132812, 0.15823936462402344, 0.16338348388671875, 0.16852760314941406, 0.17367172241210938, 0.1788158416748047, 0.1839599609375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 9.0, 21.0, 56.0, 147.0, 314.0, 268.0, 100.0, 36.0, 21.0, 9.0, 9.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0161895751953125, -0.01560831069946289, -0.015027046203613281, -0.014445781707763672, -0.013864517211914062, -0.013283252716064453, -0.012701988220214844, -0.012120723724365234, -0.011539459228515625, -0.010958194732666016, -0.010376930236816406, -0.009795665740966797, -0.009214401245117188, -0.008633136749267578, -0.008051872253417969, -0.007470607757568359, -0.00688934326171875, -0.006308078765869141, -0.005726814270019531, -0.005145549774169922, -0.0045642852783203125, -0.003983020782470703, -0.0034017562866210938, -0.0028204917907714844, -0.002239227294921875, -0.0016579627990722656, -0.0010766983032226562, -0.0004954338073730469, 8.58306884765625e-05, 0.0006670951843261719, 0.0012483596801757812, 0.0018296241760253906, 0.002410888671875, 0.0029921531677246094, 0.0035734176635742188, 0.004154682159423828, 0.0047359466552734375, 0.005317211151123047, 0.005898475646972656, 0.006479740142822266, 0.007061004638671875, 0.007642269134521484, 0.008223533630371094, 0.008804798126220703, 0.009386062622070312, 0.009967327117919922, 0.010548591613769531, 0.01112985610961914, 0.01171112060546875, 0.01229238510131836, 0.012873649597167969, 0.013454914093017578, 0.014036178588867188, 0.014617443084716797, 0.015198707580566406, 0.015779972076416016, 0.016361236572265625, 0.016942501068115234, 0.017523765563964844, 0.018105030059814453, 0.018686294555664062, 0.019267559051513672, 0.01984882354736328, 0.02043008804321289, 0.0210113525390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 14.0, 26.0, 52.0, 57.0, 156.0, 293.0, 695.0, 2492.0, 28258.0, 4023157.0, 132016.0, 5308.0, 1020.0, 379.0, 158.0, 96.0, 41.0, 25.0, 17.0, 8.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08380126953125, -0.0817418098449707, -0.0796823501586914, -0.07762289047241211, -0.07556343078613281, -0.07350397109985352, -0.07144451141357422, -0.06938505172729492, -0.06732559204101562, -0.06526613235473633, -0.06320667266845703, -0.061147212982177734, -0.05908775329589844, -0.05702829360961914, -0.054968833923339844, -0.05290937423706055, -0.05084991455078125, -0.04879045486450195, -0.046730995178222656, -0.04467153549194336, -0.04261207580566406, -0.040552616119384766, -0.03849315643310547, -0.03643369674682617, -0.034374237060546875, -0.03231477737426758, -0.03025531768798828, -0.028195858001708984, -0.026136398315429688, -0.02407693862915039, -0.022017478942871094, -0.019958019256591797, -0.0178985595703125, -0.015839099884033203, -0.013779640197753906, -0.01172018051147461, -0.009660720825195312, -0.007601261138916016, -0.005541801452636719, -0.003482341766357422, -0.001422882080078125, 0.0006365776062011719, 0.0026960372924804688, 0.004755496978759766, 0.0068149566650390625, 0.00887441635131836, 0.010933876037597656, 0.012993335723876953, 0.01505279541015625, 0.017112255096435547, 0.019171714782714844, 0.02123117446899414, 0.023290634155273438, 0.025350093841552734, 0.02740955352783203, 0.029469013214111328, 0.031528472900390625, 0.03358793258666992, 0.03564739227294922, 0.037706851959228516, 0.03976631164550781, 0.04182577133178711, 0.043885231018066406, 0.0459446907043457, 0.048004150390625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 7.0, 8.0, 11.0, 19.0, 18.0, 24.0, 34.0, 83.0, 119.0, 215.0, 537.0, 1919.0, 573.0, 232.0, 110.0, 70.0, 36.0, 24.0, 19.0, 7.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0299224853515625, -0.029292821884155273, -0.028663158416748047, -0.02803349494934082, -0.027403831481933594, -0.026774168014526367, -0.02614450454711914, -0.025514841079711914, -0.024885177612304688, -0.02425551414489746, -0.023625850677490234, -0.022996187210083008, -0.02236652374267578, -0.021736860275268555, -0.021107196807861328, -0.0204775333404541, -0.019847869873046875, -0.01921820640563965, -0.018588542938232422, -0.017958879470825195, -0.01732921600341797, -0.016699552536010742, -0.016069889068603516, -0.015440225601196289, -0.014810562133789062, -0.014180898666381836, -0.01355123519897461, -0.012921571731567383, -0.012291908264160156, -0.01166224479675293, -0.011032581329345703, -0.010402917861938477, -0.00977325439453125, -0.009143590927124023, -0.008513927459716797, -0.00788426399230957, -0.007254600524902344, -0.006624937057495117, -0.005995273590087891, -0.005365610122680664, -0.0047359466552734375, -0.004106283187866211, -0.0034766197204589844, -0.002846956253051758, -0.0022172927856445312, -0.0015876293182373047, -0.0009579658508300781, -0.00032830238342285156, 0.000301361083984375, 0.0009310245513916016, 0.0015606880187988281, 0.0021903514862060547, 0.0028200149536132812, 0.003449678421020508, 0.004079341888427734, 0.004709005355834961, 0.0053386688232421875, 0.005968332290649414, 0.006597995758056641, 0.007227659225463867, 0.007857322692871094, 0.00848698616027832, 0.009116649627685547, 0.009746313095092773, 0.0103759765625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 16.0, 42.0, 136.0, 384.0, 317.0, 84.0, 19.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1301613450050354, -0.12550246715545654, -0.12084360420703888, -0.11618472635746002, -0.11152585595846176, -0.1068669855594635, -0.10220810770988464, -0.09754923731088638, -0.09289036691188812, -0.08823149651288986, -0.0835726261138916, -0.07891374826431274, -0.07425487786531448, -0.06959600746631622, -0.06493712961673737, -0.060278259217739105, -0.055619388818740845, -0.050960518419742584, -0.046301644295454025, -0.041642770171165466, -0.036983899772167206, -0.032325029373168945, -0.027666155248880386, -0.023007281124591827, -0.018348410725593567, -0.013689538463950157, -0.009030666202306747, -0.004371793940663338, 0.000287078320980072, 0.004945950582623482, 0.009604822844266891, 0.01426369696855545, 0.01892256736755371, 0.02358143962919712, 0.02824031189084053, 0.03289918601512909, 0.03755805641412735, 0.04221692681312561, 0.04687580093741417, 0.05153467506170273, 0.05619354546070099, 0.06085241585969925, 0.06551128625869751, 0.07017016410827637, 0.07482903450727463, 0.07948790490627289, 0.08414678275585175, 0.08880565315485, 0.09346452355384827, 0.09812339395284653, 0.10278226435184479, 0.10744114220142365, 0.1121000126004219, 0.11675888299942017, 0.12141776084899902, 0.12607663869857788, 0.13073550164699554, 0.1353943794965744, 0.14005324244499207, 0.14471212029457092, 0.14937099814414978, 0.15402986109256744, 0.1586887389421463, 0.16334760189056396, 0.16800647974014282]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 10.0, 11.0, 13.0, 13.0, 14.0, 18.0, 29.0, 33.0, 41.0, 37.0, 43.0, 27.0, 35.0, 37.0, 43.0, 47.0, 52.0, 46.0, 52.0, 51.0, 44.0, 46.0, 32.0, 39.0, 28.0, 21.0, 26.0, 23.0, 21.0, 16.0, 11.0, 14.0, 12.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.049556076526641846, -0.04827851057052612, -0.0470009446144104, -0.04572337493300438, -0.04444580897688866, -0.043168243020772934, -0.04189067333936691, -0.04061310738325119, -0.03933554142713547, -0.038057975471019745, -0.03678040951490402, -0.035502839833498, -0.03422527387738228, -0.032947707921266556, -0.031670138239860535, -0.030392572283744812, -0.02911500632762909, -0.027837440371513367, -0.026559872552752495, -0.025282304733991623, -0.0240047387778759, -0.022727172821760178, -0.021449605002999306, -0.020172037184238434, -0.01889447122812271, -0.01761690527200699, -0.016339337453246117, -0.01506177056580782, -0.013784203678369522, -0.012506636790931225, -0.011229069903492928, -0.00995150301605463, -0.008673936128616333, -0.007396369241178036, -0.0061188023537397385, -0.004841235466301441, -0.003563668578863144, -0.0022861016914248466, -0.0010085348039865494, 0.0002690320834517479, 0.0015465989708900452, 0.0028241658583283424, 0.00410173274576664, 0.005379299633204937, 0.006656866520643234, 0.007934433408081532, 0.009212000295519829, 0.010489567182958126, 0.011767134070396423, 0.01304470095783472, 0.014322267845273018, 0.015599834732711315, 0.016877401620149612, 0.018154967576265335, 0.019432535395026207, 0.02071010321378708, 0.0219876691699028, 0.023265235126018524, 0.024542802944779396, 0.025820370763540268, 0.02709793671965599, 0.028375502675771713, 0.029653070494532585, 0.030930638313293457, 0.03220820426940918]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 3.0, 6.0, 10.0, 26.0, 13.0, 21.0, 43.0, 40.0, 52.0, 78.0, 87.0, 123.0, 167.0, 264.0, 366.0, 619.0, 1465.0, 7212.0, 299703.0, 723420.0, 10980.0, 1772.0, 722.0, 398.0, 255.0, 191.0, 117.0, 110.0, 67.0, 33.0, 49.0, 32.0, 27.0, 22.0, 18.0, 8.0, 10.0, 5.0, 5.0, 5.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0693359375, -0.06710529327392578, -0.06487464904785156, -0.06264400482177734, -0.060413360595703125, -0.058182716369628906, -0.05595207214355469, -0.05372142791748047, -0.05149078369140625, -0.04926013946533203, -0.04702949523925781, -0.044798851013183594, -0.042568206787109375, -0.040337562561035156, -0.03810691833496094, -0.03587627410888672, -0.0336456298828125, -0.03141498565673828, -0.029184341430664062, -0.026953697204589844, -0.024723052978515625, -0.022492408752441406, -0.020261764526367188, -0.01803112030029297, -0.01580047607421875, -0.013569831848144531, -0.011339187622070312, -0.009108543395996094, -0.006877899169921875, -0.004647254943847656, -0.0024166107177734375, -0.00018596649169921875, 0.002044677734375, 0.004275321960449219, 0.0065059661865234375, 0.008736610412597656, 0.010967254638671875, 0.013197898864746094, 0.015428543090820312, 0.01765918731689453, 0.01988983154296875, 0.02212047576904297, 0.024351119995117188, 0.026581764221191406, 0.028812408447265625, 0.031043052673339844, 0.03327369689941406, 0.03550434112548828, 0.0377349853515625, 0.03996562957763672, 0.04219627380371094, 0.044426918029785156, 0.046657562255859375, 0.048888206481933594, 0.05111885070800781, 0.05334949493408203, 0.05558013916015625, 0.05781078338623047, 0.06004142761230469, 0.062272071838378906, 0.06450271606445312, 0.06673336029052734, 0.06896400451660156, 0.07119464874267578, 0.07342529296875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 12.0, 12.0, 26.0, 82.0, 180.0, 360.0, 192.0, 70.0, 38.0, 11.0, 12.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0154266357421875, -0.01484537124633789, -0.014264106750488281, -0.013682842254638672, -0.013101577758789062, -0.012520313262939453, -0.011939048767089844, -0.011357784271240234, -0.010776519775390625, -0.010195255279541016, -0.009613990783691406, -0.009032726287841797, -0.008451461791992188, -0.007870197296142578, -0.007288932800292969, -0.006707668304443359, -0.00612640380859375, -0.005545139312744141, -0.004963874816894531, -0.004382610321044922, -0.0038013458251953125, -0.003220081329345703, -0.0026388168334960938, -0.0020575523376464844, -0.001476287841796875, -0.0008950233459472656, -0.00031375885009765625, 0.0002675056457519531, 0.0008487701416015625, 0.0014300346374511719, 0.0020112991333007812, 0.0025925636291503906, 0.003173828125, 0.0037550926208496094, 0.004336357116699219, 0.004917621612548828, 0.0054988861083984375, 0.006080150604248047, 0.006661415100097656, 0.007242679595947266, 0.007823944091796875, 0.008405208587646484, 0.008986473083496094, 0.009567737579345703, 0.010149002075195312, 0.010730266571044922, 0.011311531066894531, 0.01189279556274414, 0.01247406005859375, 0.01305532455444336, 0.013636589050292969, 0.014217853546142578, 0.014799118041992188, 0.015380382537841797, 0.015961647033691406, 0.016542911529541016, 0.017124176025390625, 0.017705440521240234, 0.018286705017089844, 0.018867969512939453, 0.019449234008789062, 0.020030498504638672, 0.02061176300048828, 0.02119302749633789, 0.0217742919921875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 2.0, 13.0, 13.0, 17.0, 21.0, 32.0, 38.0, 47.0, 54.0, 99.0, 112.0, 181.0, 322.0, 837.0, 16906.0, 1009734.0, 18283.0, 929.0, 296.0, 173.0, 127.0, 78.0, 43.0, 56.0, 36.0, 20.0, 20.0, 15.0, 15.0, 10.0, 8.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08892822265625, -0.08580875396728516, -0.08268928527832031, -0.07956981658935547, -0.07645034790039062, -0.07333087921142578, -0.07021141052246094, -0.0670919418334961, -0.06397247314453125, -0.060853004455566406, -0.05773353576660156, -0.05461406707763672, -0.051494598388671875, -0.04837512969970703, -0.04525566101074219, -0.042136192321777344, -0.0390167236328125, -0.035897254943847656, -0.03277778625488281, -0.02965831756591797, -0.026538848876953125, -0.02341938018798828, -0.020299911499023438, -0.017180442810058594, -0.01406097412109375, -0.010941505432128906, -0.007822036743164062, -0.004702568054199219, -0.001583099365234375, 0.0015363693237304688, 0.0046558380126953125, 0.007775306701660156, 0.010894775390625, 0.014014244079589844, 0.017133712768554688, 0.02025318145751953, 0.023372650146484375, 0.02649211883544922, 0.029611587524414062, 0.032731056213378906, 0.03585052490234375, 0.038969993591308594, 0.04208946228027344, 0.04520893096923828, 0.048328399658203125, 0.05144786834716797, 0.05456733703613281, 0.057686805725097656, 0.0608062744140625, 0.06392574310302734, 0.06704521179199219, 0.07016468048095703, 0.07328414916992188, 0.07640361785888672, 0.07952308654785156, 0.0826425552368164, 0.08576202392578125, 0.0888814926147461, 0.09200096130371094, 0.09512042999267578, 0.09823989868164062, 0.10135936737060547, 0.10447883605957031, 0.10759830474853516, 0.1107177734375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 8.0, 2.0, 6.0, 14.0, 12.0, 13.0, 23.0, 24.0, 27.0, 31.0, 41.0, 41.0, 41.0, 56.0, 55.0, 61.0, 63.0, 51.0, 49.0, 70.0, 45.0, 51.0, 46.0, 23.0, 28.0, 31.0, 20.0, 16.0, 11.0, 11.0, 13.0, 6.0, 11.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01403045654296875, -0.013530611991882324, -0.013030767440795898, -0.012530922889709473, -0.012031078338623047, -0.011531233787536621, -0.011031389236450195, -0.01053154468536377, -0.010031700134277344, -0.009531855583190918, -0.009032011032104492, -0.008532166481018066, -0.00803232192993164, -0.007532477378845215, -0.007032632827758789, -0.006532788276672363, -0.0060329437255859375, -0.005533099174499512, -0.005033254623413086, -0.00453341007232666, -0.004033565521240234, -0.0035337209701538086, -0.003033876419067383, -0.002534031867980957, -0.0020341873168945312, -0.0015343427658081055, -0.0010344982147216797, -0.0005346536636352539, -3.4809112548828125e-05, 0.00046503543853759766, 0.0009648799896240234, 0.0014647245407104492, 0.001964569091796875, 0.0024644136428833008, 0.0029642581939697266, 0.0034641027450561523, 0.003963947296142578, 0.004463791847229004, 0.00496363639831543, 0.0054634809494018555, 0.005963325500488281, 0.006463170051574707, 0.006963014602661133, 0.007462859153747559, 0.007962703704833984, 0.00846254825592041, 0.008962392807006836, 0.009462237358093262, 0.009962081909179688, 0.010461926460266113, 0.010961771011352539, 0.011461615562438965, 0.01196146011352539, 0.012461304664611816, 0.012961149215698242, 0.013460993766784668, 0.013960838317871094, 0.01446068286895752, 0.014960527420043945, 0.015460371971130371, 0.015960216522216797, 0.016460061073303223, 0.01695990562438965, 0.017459750175476074, 0.0179595947265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 7.0, 9.0, 7.0, 9.0, 15.0, 17.0, 37.0, 51.0, 106.0, 283.0, 932.0, 4851.0, 89068.0, 938777.0, 11754.0, 1777.0, 447.0, 153.0, 84.0, 40.0, 33.0, 31.0, 20.0, 13.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03436279296875, -0.03318643569946289, -0.03201007843017578, -0.030833721160888672, -0.029657363891601562, -0.028481006622314453, -0.027304649353027344, -0.026128292083740234, -0.024951934814453125, -0.023775577545166016, -0.022599220275878906, -0.021422863006591797, -0.020246505737304688, -0.019070148468017578, -0.01789379119873047, -0.01671743392944336, -0.01554107666015625, -0.01436471939086914, -0.013188362121582031, -0.012012004852294922, -0.010835647583007812, -0.009659290313720703, -0.008482933044433594, -0.007306575775146484, -0.006130218505859375, -0.004953861236572266, -0.0037775039672851562, -0.002601146697998047, -0.0014247894287109375, -0.0002484321594238281, 0.0009279251098632812, 0.0021042823791503906, 0.0032806396484375, 0.004456996917724609, 0.005633354187011719, 0.006809711456298828, 0.007986068725585938, 0.009162425994873047, 0.010338783264160156, 0.011515140533447266, 0.012691497802734375, 0.013867855072021484, 0.015044212341308594, 0.016220569610595703, 0.017396926879882812, 0.018573284149169922, 0.01974964141845703, 0.02092599868774414, 0.02210235595703125, 0.02327871322631836, 0.02445507049560547, 0.025631427764892578, 0.026807785034179688, 0.027984142303466797, 0.029160499572753906, 0.030336856842041016, 0.031513214111328125, 0.032689571380615234, 0.033865928649902344, 0.03504228591918945, 0.03621864318847656, 0.03739500045776367, 0.03857135772705078, 0.03974771499633789, 0.040924072265625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 3.0, 14.0, 21.0, 22.0, 33.0, 45.0, 66.0, 98.0, 138.0, 132.0, 115.0, 90.0, 55.0, 51.0, 30.0, 25.0, 14.0, 18.0, 8.0, 5.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000148773193359375, -0.00014458410441875458, -0.00014039501547813416, -0.00013620592653751373, -0.0001320168375968933, -0.0001278277486562729, -0.00012363865971565247, -0.00011944957077503204, -0.00011526048183441162, -0.0001110713928937912, -0.00010688230395317078, -0.00010269321501255035, -9.850412607192993e-05, -9.431503713130951e-05, -9.012594819068909e-05, -8.593685925006866e-05, -8.174777030944824e-05, -7.755868136882782e-05, -7.33695924282074e-05, -6.918050348758698e-05, -6.499141454696655e-05, -6.080232560634613e-05, -5.661323666572571e-05, -5.2424147725105286e-05, -4.823505878448486e-05, -4.404596984386444e-05, -3.985688090324402e-05, -3.5667791962623596e-05, -3.1478703022003174e-05, -2.728961408138275e-05, -2.310052514076233e-05, -1.8911436200141907e-05, -1.4722347259521484e-05, -1.0533258318901062e-05, -6.34416937828064e-06, -2.1550804376602173e-06, 2.034008502960205e-06, 6.2230974435806274e-06, 1.041218638420105e-05, 1.4601275324821472e-05, 1.8790364265441895e-05, 2.2979453206062317e-05, 2.716854214668274e-05, 3.135763108730316e-05, 3.5546720027923584e-05, 3.9735808968544006e-05, 4.392489790916443e-05, 4.811398684978485e-05, 5.2303075790405273e-05, 5.6492164731025696e-05, 6.068125367164612e-05, 6.487034261226654e-05, 6.905943155288696e-05, 7.324852049350739e-05, 7.743760943412781e-05, 8.162669837474823e-05, 8.581578731536865e-05, 9.000487625598907e-05, 9.41939651966095e-05, 9.838305413722992e-05, 0.00010257214307785034, 0.00010676123201847076, 0.00011095032095909119, 0.00011513940989971161, 0.00011932849884033203]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 6.0, 5.0, 10.0, 7.0, 17.0, 11.0, 20.0, 29.0, 19.0, 47.0, 50.0, 82.0, 147.0, 393.0, 5009.0, 1010823.0, 30473.0, 842.0, 184.0, 107.0, 67.0, 49.0, 31.0, 28.0, 22.0, 9.0, 14.0, 22.0, 8.0, 8.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0235748291015625, -0.02269148826599121, -0.021808147430419922, -0.020924806594848633, -0.020041465759277344, -0.019158124923706055, -0.018274784088134766, -0.017391443252563477, -0.016508102416992188, -0.015624761581420898, -0.01474142074584961, -0.01385807991027832, -0.012974739074707031, -0.012091398239135742, -0.011208057403564453, -0.010324716567993164, -0.009441375732421875, -0.008558034896850586, -0.007674694061279297, -0.006791353225708008, -0.005908012390136719, -0.00502467155456543, -0.004141330718994141, -0.0032579898834228516, -0.0023746490478515625, -0.0014913082122802734, -0.0006079673767089844, 0.0002753734588623047, 0.0011587142944335938, 0.002042055130004883, 0.002925395965576172, 0.003808736801147461, 0.00469207763671875, 0.005575418472290039, 0.006458759307861328, 0.007342100143432617, 0.008225440979003906, 0.009108781814575195, 0.009992122650146484, 0.010875463485717773, 0.011758804321289062, 0.012642145156860352, 0.01352548599243164, 0.01440882682800293, 0.015292167663574219, 0.016175508499145508, 0.017058849334716797, 0.017942190170288086, 0.018825531005859375, 0.019708871841430664, 0.020592212677001953, 0.021475553512573242, 0.02235889434814453, 0.02324223518371582, 0.02412557601928711, 0.0250089168548584, 0.025892257690429688, 0.026775598526000977, 0.027658939361572266, 0.028542280197143555, 0.029425621032714844, 0.030308961868286133, 0.031192302703857422, 0.03207564353942871, 0.032958984375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 3.0, 5.0, 2.0, 8.0, 7.0, 15.0, 9.0, 17.0, 23.0, 14.0, 35.0, 24.0, 41.0, 44.0, 54.0, 92.0, 120.0, 113.0, 83.0, 48.0, 54.0, 35.0, 37.0, 27.0, 11.0, 19.0, 11.0, 7.0, 16.0, 8.0, 9.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003673553466796875, -0.0035366415977478027, -0.0033997297286987305, -0.003262817859649658, -0.003125905990600586, -0.0029889941215515137, -0.0028520822525024414, -0.002715170383453369, -0.002578258514404297, -0.0024413466453552246, -0.0023044347763061523, -0.00216752290725708, -0.002030611038208008, -0.0018936991691589355, -0.0017567873001098633, -0.001619875431060791, -0.0014829635620117188, -0.0013460516929626465, -0.0012091398239135742, -0.001072227954864502, -0.0009353160858154297, -0.0007984042167663574, -0.0006614923477172852, -0.0005245804786682129, -0.0003876686096191406, -0.00025075674057006836, -0.0001138448715209961, 2.3066997528076172e-05, 0.00015997886657714844, 0.0002968907356262207, 0.00043380260467529297, 0.0005707144737243652, 0.0007076263427734375, 0.0008445382118225098, 0.000981450080871582, 0.0011183619499206543, 0.0012552738189697266, 0.0013921856880187988, 0.001529097557067871, 0.0016660094261169434, 0.0018029212951660156, 0.0019398331642150879, 0.00207674503326416, 0.0022136569023132324, 0.0023505687713623047, 0.002487480640411377, 0.0026243925094604492, 0.0027613043785095215, 0.0028982162475585938, 0.003035128116607666, 0.0031720399856567383, 0.0033089518547058105, 0.003445863723754883, 0.003582775592803955, 0.0037196874618530273, 0.0038565993309020996, 0.003993511199951172, 0.004130423069000244, 0.004267334938049316, 0.004404246807098389, 0.004541158676147461, 0.004678070545196533, 0.0048149824142456055, 0.004951894283294678, 0.00508880615234375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 11.0, 57.0, 345.0, 495.0, 82.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2985553741455078, -0.29031455516815186, -0.2820737659931183, -0.27383294701576233, -0.26559212803840637, -0.2573513388633728, -0.24911051988601685, -0.2408697009086609, -0.23262889683246613, -0.22438809275627136, -0.2161472737789154, -0.20790646970272064, -0.19966566562652588, -0.19142484664916992, -0.18318404257297516, -0.1749432384967804, -0.16670241951942444, -0.15846161544322968, -0.15022079646587372, -0.14197999238967896, -0.133739173412323, -0.12549836933612823, -0.11725756525993347, -0.10901675373315811, -0.10077594220638275, -0.09253513067960739, -0.08429431915283203, -0.07605351507663727, -0.06781270354986191, -0.05957189202308655, -0.051331084221601486, -0.043090276420116425, -0.03484943509101868, -0.026608625426888466, -0.018367815762758255, -0.010127006098628044, -0.0018861964344978333, 0.006354615092277527, 0.014595422893762589, 0.02283623069524765, 0.03107704222202301, 0.03931785374879837, 0.04755866155028343, 0.055799469351768494, 0.06404028087854385, 0.07228109240531921, 0.08052189648151398, 0.08876270800828934, 0.0970035195350647, 0.10524433106184006, 0.11348514258861542, 0.12172594666481018, 0.12996676564216614, 0.1382075697183609, 0.14644837379455566, 0.15468919277191162, 0.16292999684810638, 0.17117080092430115, 0.1794116199016571, 0.18765242397785187, 0.19589322805404663, 0.2041340470314026, 0.21237485110759735, 0.22061565518379211, 0.22885647416114807]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 2.0, 2.0, 4.0, 9.0, 6.0, 2.0, 15.0, 11.0, 14.0, 21.0, 19.0, 24.0, 23.0, 39.0, 37.0, 47.0, 36.0, 55.0, 44.0, 49.0, 44.0, 56.0, 52.0, 40.0, 48.0, 49.0, 42.0, 28.0, 25.0, 23.0, 25.0, 21.0, 20.0, 14.0, 12.0, 13.0, 14.0, 6.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.055844008922576904, -0.05409380793571472, -0.05234360694885254, -0.05059340223670006, -0.048843201249837875, -0.04709300026297569, -0.04534279555082321, -0.04359259456396103, -0.041842393577098846, -0.040092192590236664, -0.03834199160337448, -0.036591786891222, -0.03484158590435982, -0.033091384917497635, -0.031341180205345154, -0.02959097921848297, -0.02784077823162079, -0.026090577244758606, -0.024340374395251274, -0.022590171545743942, -0.02083997055888176, -0.019089769572019577, -0.017339566722512245, -0.015589364804327488, -0.01383916288614273, -0.012088960967957973, -0.010338759049773216, -0.008588557131588459, -0.006838355213403702, -0.0050881532952189445, -0.0033379513770341873, -0.00158774945884943, 0.00016245245933532715, 0.0019126543775200844, 0.0036628562957048416, 0.005413058213889599, 0.007163260132074356, 0.008913462050259113, 0.01066366396844387, 0.012413865886628628, 0.014164067804813385, 0.015914268791675568, 0.0176644716411829, 0.01941467449069023, 0.021164875477552414, 0.022915076464414597, 0.02466527931392193, 0.02641548216342926, 0.028165683150291443, 0.029915884137153625, 0.03166608512401581, 0.03341628983616829, 0.03516649082303047, 0.036916691809892654, 0.038666896522045135, 0.04041709750890732, 0.0421672984957695, 0.04391749948263168, 0.045667700469493866, 0.04741790518164635, 0.04916810616850853, 0.05091830715537071, 0.05266851186752319, 0.054418712854385376, 0.05616891384124756]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 3.0, 7.0, 10.0, 15.0, 48.0, 104.0, 362.0, 3037.0, 4155366.0, 33491.0, 1346.0, 292.0, 99.0, 39.0, 17.0, 9.0, 10.0, 8.0, 8.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11883544921875, -0.11440372467041016, -0.10997200012207031, -0.10554027557373047, -0.10110855102539062, -0.09667682647705078, -0.09224510192871094, -0.0878133773803711, -0.08338165283203125, -0.0789499282836914, -0.07451820373535156, -0.07008647918701172, -0.06565475463867188, -0.06122303009033203, -0.05679130554199219, -0.052359580993652344, -0.0479278564453125, -0.043496131896972656, -0.03906440734863281, -0.03463268280029297, -0.030200958251953125, -0.02576923370361328, -0.021337509155273438, -0.016905784606933594, -0.01247406005859375, -0.008042335510253906, -0.0036106109619140625, 0.0008211135864257812, 0.005252838134765625, 0.009684562683105469, 0.014116287231445312, 0.018548011779785156, 0.022979736328125, 0.027411460876464844, 0.03184318542480469, 0.03627490997314453, 0.040706634521484375, 0.04513835906982422, 0.04957008361816406, 0.054001808166503906, 0.05843353271484375, 0.0628652572631836, 0.06729698181152344, 0.07172870635986328, 0.07616043090820312, 0.08059215545654297, 0.08502388000488281, 0.08945560455322266, 0.0938873291015625, 0.09831905364990234, 0.10275077819824219, 0.10718250274658203, 0.11161422729492188, 0.11604595184326172, 0.12047767639160156, 0.1249094009399414, 0.12934112548828125, 0.1337728500366211, 0.13820457458496094, 0.14263629913330078, 0.14706802368164062, 0.15149974822998047, 0.1559314727783203, 0.16036319732666016, 0.164794921875]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 10.0, 9.0, 22.0, 54.0, 139.0, 305.0, 272.0, 109.0, 47.0, 18.0, 13.0, 5.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0160369873046875, -0.015441656112670898, -0.014846324920654297, -0.014250993728637695, -0.013655662536621094, -0.013060331344604492, -0.01246500015258789, -0.011869668960571289, -0.011274337768554688, -0.010679006576538086, -0.010083675384521484, -0.009488344192504883, -0.008893013000488281, -0.00829768180847168, -0.007702350616455078, -0.0071070194244384766, -0.006511688232421875, -0.0059163570404052734, -0.005321025848388672, -0.00472569465637207, -0.004130363464355469, -0.003535032272338867, -0.0029397010803222656, -0.002344369888305664, -0.0017490386962890625, -0.001153707504272461, -0.0005583763122558594, 3.695487976074219e-05, 0.0006322860717773438, 0.0012276172637939453, 0.0018229484558105469, 0.0024182796478271484, 0.00301361083984375, 0.0036089420318603516, 0.004204273223876953, 0.004799604415893555, 0.005394935607910156, 0.005990266799926758, 0.006585597991943359, 0.007180929183959961, 0.0077762603759765625, 0.008371591567993164, 0.008966922760009766, 0.009562253952026367, 0.010157585144042969, 0.01075291633605957, 0.011348247528076172, 0.011943578720092773, 0.012538909912109375, 0.013134241104125977, 0.013729572296142578, 0.01432490348815918, 0.014920234680175781, 0.015515565872192383, 0.016110897064208984, 0.016706228256225586, 0.017301559448242188, 0.01789689064025879, 0.01849222183227539, 0.019087553024291992, 0.019682884216308594, 0.020278215408325195, 0.020873546600341797, 0.0214688777923584, 0.022064208984375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 5.0, 3.0, 13.0, 11.0, 19.0, 34.0, 69.0, 110.0, 317.0, 620.0, 1597.0, 6343.0, 136290.0, 3988130.0, 54024.0, 4246.0, 1287.0, 552.0, 251.0, 146.0, 86.0, 39.0, 33.0, 17.0, 11.0, 13.0, 1.0, 4.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.049957275390625, -0.048415184020996094, -0.04687309265136719, -0.04533100128173828, -0.043788909912109375, -0.04224681854248047, -0.04070472717285156, -0.039162635803222656, -0.03762054443359375, -0.036078453063964844, -0.03453636169433594, -0.03299427032470703, -0.031452178955078125, -0.02991008758544922, -0.028367996215820312, -0.026825904846191406, -0.0252838134765625, -0.023741722106933594, -0.022199630737304688, -0.02065753936767578, -0.019115447998046875, -0.01757335662841797, -0.016031265258789062, -0.014489173889160156, -0.01294708251953125, -0.011404991149902344, -0.009862899780273438, -0.008320808410644531, -0.006778717041015625, -0.005236625671386719, -0.0036945343017578125, -0.0021524429321289062, -0.0006103515625, 0.0009317398071289062, 0.0024738311767578125, 0.004015922546386719, 0.005558013916015625, 0.007100105285644531, 0.008642196655273438, 0.010184288024902344, 0.01172637939453125, 0.013268470764160156, 0.014810562133789062, 0.01635265350341797, 0.017894744873046875, 0.01943683624267578, 0.020978927612304688, 0.022521018981933594, 0.0240631103515625, 0.025605201721191406, 0.027147293090820312, 0.02868938446044922, 0.030231475830078125, 0.03177356719970703, 0.03331565856933594, 0.034857749938964844, 0.03639984130859375, 0.037941932678222656, 0.03948402404785156, 0.04102611541748047, 0.042568206787109375, 0.04411029815673828, 0.04565238952636719, 0.047194480895996094, 0.048736572265625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 4.0, 5.0, 9.0, 7.0, 15.0, 21.0, 53.0, 63.0, 100.0, 170.0, 233.0, 442.0, 809.0, 750.0, 486.0, 336.0, 210.0, 116.0, 76.0, 52.0, 50.0, 26.0, 11.0, 9.0, 5.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01318359375, -0.012743949890136719, -0.012304306030273438, -0.011864662170410156, -0.011425018310546875, -0.010985374450683594, -0.010545730590820312, -0.010106086730957031, -0.00966644287109375, -0.009226799011230469, -0.008787155151367188, -0.008347511291503906, -0.007907867431640625, -0.007468223571777344, -0.0070285797119140625, -0.006588935852050781, -0.0061492919921875, -0.005709648132324219, -0.0052700042724609375, -0.004830360412597656, -0.004390716552734375, -0.003951072692871094, -0.0035114288330078125, -0.0030717849731445312, -0.00263214111328125, -0.0021924972534179688, -0.0017528533935546875, -0.0013132095336914062, -0.000873565673828125, -0.00043392181396484375, 5.7220458984375e-06, 0.00044536590576171875, 0.000885009765625, 0.0013246536254882812, 0.0017642974853515625, 0.0022039413452148438, 0.002643585205078125, 0.0030832290649414062, 0.0035228729248046875, 0.003962516784667969, 0.00440216064453125, 0.004841804504394531, 0.0052814483642578125, 0.005721092224121094, 0.006160736083984375, 0.006600379943847656, 0.0070400238037109375, 0.007479667663574219, 0.0079193115234375, 0.008358955383300781, 0.008798599243164062, 0.009238243103027344, 0.009677886962890625, 0.010117530822753906, 0.010557174682617188, 0.010996818542480469, 0.01143646240234375, 0.011876106262207031, 0.012315750122070312, 0.012755393981933594, 0.013195037841796875, 0.013634681701660156, 0.014074325561523438, 0.014513969421386719, 0.01495361328125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 29.0, 647.0, 309.0, 22.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4934025704860687, -0.4796161949634552, -0.4658298194408417, -0.45204344391822815, -0.43825703859329224, -0.4244706630706787, -0.4106842875480652, -0.39689791202545166, -0.38311153650283813, -0.3693251609802246, -0.3555387854576111, -0.34175240993499756, -0.32796603441238403, -0.3141796588897705, -0.3003932535648346, -0.28660687804222107, -0.27282050251960754, -0.259034126996994, -0.2452477514743805, -0.23146136105060577, -0.21767498552799225, -0.20388861000537872, -0.190102219581604, -0.17631584405899048, -0.16252946853637695, -0.14874309301376343, -0.1349567174911499, -0.12117032706737518, -0.10738395154476166, -0.09359757602214813, -0.07981119304895401, -0.06602481007575989, -0.052238404750823975, -0.03845202550292015, -0.024665646255016327, -0.010879267007112503, 0.002907112240791321, 0.016693487763404846, 0.03047987073659897, 0.04426625370979309, 0.058052629232406616, 0.07183900475502014, 0.08562538772821426, 0.09941177070140839, 0.11319814622402191, 0.12698452174663544, 0.14077091217041016, 0.15455728769302368, 0.1683436632156372, 0.18213003873825073, 0.19591641426086426, 0.20970280468463898, 0.2234891802072525, 0.23727555572986603, 0.25106194615364075, 0.2648483216762543, 0.2786346971988678, 0.2924210727214813, 0.30620744824409485, 0.3199938237667084, 0.3337802290916443, 0.3475666046142578, 0.36135298013687134, 0.37513935565948486, 0.3889257311820984]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 6.0, 2.0, 5.0, 10.0, 10.0, 13.0, 11.0, 14.0, 21.0, 16.0, 17.0, 22.0, 29.0, 30.0, 30.0, 28.0, 45.0, 37.0, 57.0, 51.0, 43.0, 39.0, 41.0, 33.0, 41.0, 36.0, 31.0, 48.0, 27.0, 30.0, 25.0, 19.0, 18.0, 21.0, 17.0, 14.0, 12.0, 9.0, 12.0, 13.0, 6.0, 2.0, 6.0, 4.0, 2.0, 1.0, 0.0, 4.0], "bins": [-0.04567974805831909, -0.04443579912185669, -0.043191853910684586, -0.04194790869951248, -0.04070395976305008, -0.03946001082658768, -0.03821606561541557, -0.03697212040424347, -0.03572817146778107, -0.034484222531318665, -0.03324027732014656, -0.03199633210897446, -0.030752383172512054, -0.0295084360986948, -0.028264489024877548, -0.027020541951060295, -0.025776594877243042, -0.02453264780342579, -0.023288700729608536, -0.022044753655791283, -0.02080080658197403, -0.019556859508156776, -0.018312912434339523, -0.01706896536052227, -0.015825018286705017, -0.014581071212887764, -0.01333712413907051, -0.012093177065253258, -0.010849229991436005, -0.009605282917618752, -0.008361335843801498, -0.007117388769984245, -0.005873441696166992, -0.004629494622349739, -0.003385547548532486, -0.002141600474715233, -0.0008976534008979797, 0.0003462936729192734, 0.0015902407467365265, 0.0028341878205537796, 0.004078134894371033, 0.005322081968188286, 0.006566029042005539, 0.007809976115822792, 0.009053923189640045, 0.010297870263457298, 0.011541817337274551, 0.012785764411091805, 0.014029711484909058, 0.01527365855872631, 0.016517605632543564, 0.017761552706360817, 0.01900549978017807, 0.020249446853995323, 0.021493393927812576, 0.02273734100162983, 0.023981288075447083, 0.025225235149264336, 0.02646918222308159, 0.027713129296898842, 0.028957076370716095, 0.030201023444533348, 0.0314449705183506, 0.032688915729522705, 0.03393286466598511]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 13.0, 8.0, 28.0, 13.0, 36.0, 26.0, 45.0, 53.0, 75.0, 94.0, 128.0, 202.0, 328.0, 585.0, 1344.0, 6036.0, 94454.0, 913329.0, 26274.0, 3150.0, 934.0, 442.0, 257.0, 179.0, 133.0, 103.0, 63.0, 48.0, 32.0, 28.0, 24.0, 17.0, 14.0, 8.0, 14.0, 9.0, 4.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0], "bins": [-0.10711669921875, -0.10416698455810547, -0.10121726989746094, -0.0982675552368164, -0.09531784057617188, -0.09236812591552734, -0.08941841125488281, -0.08646869659423828, -0.08351898193359375, -0.08056926727294922, -0.07761955261230469, -0.07466983795166016, -0.07172012329101562, -0.0687704086303711, -0.06582069396972656, -0.06287097930908203, -0.0599212646484375, -0.05697154998779297, -0.05402183532714844, -0.051072120666503906, -0.048122406005859375, -0.045172691345214844, -0.04222297668457031, -0.03927326202392578, -0.03632354736328125, -0.03337383270263672, -0.030424118041992188, -0.027474403381347656, -0.024524688720703125, -0.021574974060058594, -0.018625259399414062, -0.01567554473876953, -0.012725830078125, -0.009776115417480469, -0.0068264007568359375, -0.0038766860961914062, -0.000926971435546875, 0.0020227432250976562, 0.0049724578857421875, 0.007922172546386719, 0.01087188720703125, 0.013821601867675781, 0.016771316528320312, 0.019721031188964844, 0.022670745849609375, 0.025620460510253906, 0.028570175170898438, 0.03151988983154297, 0.0344696044921875, 0.03741931915283203, 0.04036903381347656, 0.043318748474121094, 0.046268463134765625, 0.049218177795410156, 0.05216789245605469, 0.05511760711669922, 0.05806732177734375, 0.06101703643798828, 0.06396675109863281, 0.06691646575927734, 0.06986618041992188, 0.0728158950805664, 0.07576560974121094, 0.07871532440185547, 0.0816650390625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 8.0, 12.0, 36.0, 101.0, 195.0, 330.0, 174.0, 83.0, 31.0, 15.0, 13.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.016021728515625, -0.015438556671142578, -0.014855384826660156, -0.014272212982177734, -0.013689041137695312, -0.01310586929321289, -0.012522697448730469, -0.011939525604248047, -0.011356353759765625, -0.010773181915283203, -0.010190010070800781, -0.00960683822631836, -0.009023666381835938, -0.008440494537353516, -0.007857322692871094, -0.007274150848388672, -0.00669097900390625, -0.006107807159423828, -0.005524635314941406, -0.004941463470458984, -0.0043582916259765625, -0.0037751197814941406, -0.0031919479370117188, -0.002608776092529297, -0.002025604248046875, -0.0014424324035644531, -0.0008592605590820312, -0.0002760887145996094, 0.0003070831298828125, 0.0008902549743652344, 0.0014734268188476562, 0.002056598663330078, 0.0026397705078125, 0.003222942352294922, 0.0038061141967773438, 0.004389286041259766, 0.0049724578857421875, 0.005555629730224609, 0.006138801574707031, 0.006721973419189453, 0.007305145263671875, 0.007888317108154297, 0.008471488952636719, 0.00905466079711914, 0.009637832641601562, 0.010221004486083984, 0.010804176330566406, 0.011387348175048828, 0.01197052001953125, 0.012553691864013672, 0.013136863708496094, 0.013720035552978516, 0.014303207397460938, 0.01488637924194336, 0.015469551086425781, 0.016052722930908203, 0.016635894775390625, 0.017219066619873047, 0.01780223846435547, 0.01838541030883789, 0.018968582153320312, 0.019551753997802734, 0.020134925842285156, 0.020718097686767578, 0.02130126953125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 9.0, 4.0, 6.0, 7.0, 12.0, 12.0, 19.0, 16.0, 24.0, 38.0, 46.0, 73.0, 84.0, 116.0, 140.0, 167.0, 263.0, 393.0, 662.0, 1551.0, 5427.0, 34319.0, 512909.0, 452682.0, 31023.0, 5035.0, 1453.0, 620.0, 381.0, 251.0, 217.0, 140.0, 104.0, 93.0, 64.0, 46.0, 36.0, 25.0, 25.0, 17.0, 13.0, 11.0, 7.0, 6.0, 6.0, 0.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0443115234375, -0.04278230667114258, -0.041253089904785156, -0.039723873138427734, -0.03819465637207031, -0.03666543960571289, -0.03513622283935547, -0.03360700607299805, -0.032077789306640625, -0.030548572540283203, -0.02901935577392578, -0.02749013900756836, -0.025960922241210938, -0.024431705474853516, -0.022902488708496094, -0.021373271942138672, -0.01984405517578125, -0.018314838409423828, -0.016785621643066406, -0.015256404876708984, -0.013727188110351562, -0.01219797134399414, -0.010668754577636719, -0.009139537811279297, -0.007610321044921875, -0.006081104278564453, -0.004551887512207031, -0.0030226707458496094, -0.0014934539794921875, 3.5762786865234375e-05, 0.0015649795532226562, 0.003094196319580078, 0.0046234130859375, 0.006152629852294922, 0.007681846618652344, 0.009211063385009766, 0.010740280151367188, 0.01226949691772461, 0.013798713684082031, 0.015327930450439453, 0.016857147216796875, 0.018386363983154297, 0.01991558074951172, 0.02144479751586914, 0.022974014282226562, 0.024503231048583984, 0.026032447814941406, 0.027561664581298828, 0.02909088134765625, 0.030620098114013672, 0.032149314880371094, 0.033678531646728516, 0.03520774841308594, 0.03673696517944336, 0.03826618194580078, 0.0397953987121582, 0.041324615478515625, 0.04285383224487305, 0.04438304901123047, 0.04591226577758789, 0.04744148254394531, 0.048970699310302734, 0.050499916076660156, 0.05202913284301758, 0.053558349609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 3.0, 3.0, 8.0, 9.0, 9.0, 20.0, 13.0, 18.0, 24.0, 21.0, 23.0, 34.0, 33.0, 43.0, 37.0, 45.0, 50.0, 63.0, 68.0, 49.0, 68.0, 52.0, 49.0, 37.0, 31.0, 31.0, 25.0, 32.0, 23.0, 10.0, 16.0, 11.0, 15.0, 10.0, 7.0, 5.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.015838623046875, -0.015334367752075195, -0.01483011245727539, -0.014325857162475586, -0.013821601867675781, -0.013317346572875977, -0.012813091278076172, -0.012308835983276367, -0.011804580688476562, -0.011300325393676758, -0.010796070098876953, -0.010291814804077148, -0.009787559509277344, -0.009283304214477539, -0.008779048919677734, -0.00827479362487793, -0.007770538330078125, -0.00726628303527832, -0.006762027740478516, -0.006257772445678711, -0.005753517150878906, -0.0052492618560791016, -0.004745006561279297, -0.004240751266479492, -0.0037364959716796875, -0.003232240676879883, -0.002727985382080078, -0.0022237300872802734, -0.0017194747924804688, -0.001215219497680664, -0.0007109642028808594, -0.0002067089080810547, 0.00029754638671875, 0.0008018016815185547, 0.0013060569763183594, 0.001810312271118164, 0.0023145675659179688, 0.0028188228607177734, 0.003323078155517578, 0.003827333450317383, 0.0043315887451171875, 0.004835844039916992, 0.005340099334716797, 0.0058443546295166016, 0.006348609924316406, 0.006852865219116211, 0.007357120513916016, 0.00786137580871582, 0.008365631103515625, 0.00886988639831543, 0.009374141693115234, 0.009878396987915039, 0.010382652282714844, 0.010886907577514648, 0.011391162872314453, 0.011895418167114258, 0.012399673461914062, 0.012903928756713867, 0.013408184051513672, 0.013912439346313477, 0.014416694641113281, 0.014920949935913086, 0.01542520523071289, 0.015929460525512695, 0.0164337158203125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 7.0, 8.0, 11.0, 12.0, 17.0, 17.0, 22.0, 43.0, 58.0, 111.0, 178.0, 379.0, 850.0, 2795.0, 14112.0, 218573.0, 777519.0, 27291.0, 4353.0, 1204.0, 427.0, 209.0, 116.0, 73.0, 54.0, 41.0, 21.0, 15.0, 11.0, 8.0, 7.0, 2.0, 7.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03778076171875, -0.03656816482543945, -0.035355567932128906, -0.03414297103881836, -0.03293037414550781, -0.031717777252197266, -0.03050518035888672, -0.029292583465576172, -0.028079986572265625, -0.026867389678955078, -0.02565479278564453, -0.024442195892333984, -0.023229598999023438, -0.02201700210571289, -0.020804405212402344, -0.019591808319091797, -0.01837921142578125, -0.017166614532470703, -0.015954017639160156, -0.01474142074584961, -0.013528823852539062, -0.012316226959228516, -0.011103630065917969, -0.009891033172607422, -0.008678436279296875, -0.007465839385986328, -0.006253242492675781, -0.005040645599365234, -0.0038280487060546875, -0.0026154518127441406, -0.0014028549194335938, -0.00019025802612304688, 0.0010223388671875, 0.002234935760498047, 0.0034475326538085938, 0.004660129547119141, 0.0058727264404296875, 0.007085323333740234, 0.008297920227050781, 0.009510517120361328, 0.010723114013671875, 0.011935710906982422, 0.013148307800292969, 0.014360904693603516, 0.015573501586914062, 0.01678609848022461, 0.017998695373535156, 0.019211292266845703, 0.02042388916015625, 0.021636486053466797, 0.022849082946777344, 0.02406167984008789, 0.025274276733398438, 0.026486873626708984, 0.02769947052001953, 0.028912067413330078, 0.030124664306640625, 0.03133726119995117, 0.03254985809326172, 0.033762454986572266, 0.03497505187988281, 0.03618764877319336, 0.037400245666503906, 0.03861284255981445, 0.039825439453125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 5.0, 3.0, 2.0, 1.0, 4.0, 5.0, 2.0, 6.0, 9.0, 5.0, 11.0, 17.0, 23.0, 32.0, 49.0, 80.0, 108.0, 146.0, 140.0, 99.0, 61.0, 49.0, 44.0, 21.0, 22.0, 7.0, 8.0, 11.0, 11.0, 3.0, 6.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.565187454223633e-05, -8.17691907286644e-05, -7.788650691509247e-05, -7.400382310152054e-05, -7.012113928794861e-05, -6.623845547437668e-05, -6.235577166080475e-05, -5.847308784723282e-05, -5.459040403366089e-05, -5.070772022008896e-05, -4.682503640651703e-05, -4.29423525929451e-05, -3.905966877937317e-05, -3.517698496580124e-05, -3.129430115222931e-05, -2.741161733865738e-05, -2.352893352508545e-05, -1.964624971151352e-05, -1.576356589794159e-05, -1.188088208436966e-05, -7.99819827079773e-06, -4.1155144572257996e-06, -2.3283064365386963e-07, 3.6498531699180603e-06, 7.53253698348999e-06, 1.141522079706192e-05, 1.529790461063385e-05, 1.918058842420578e-05, 2.306327223777771e-05, 2.694595605134964e-05, 3.082863986492157e-05, 3.47113236784935e-05, 3.859400749206543e-05, 4.247669130563736e-05, 4.635937511920929e-05, 5.024205893278122e-05, 5.412474274635315e-05, 5.800742655992508e-05, 6.189011037349701e-05, 6.577279418706894e-05, 6.965547800064087e-05, 7.35381618142128e-05, 7.742084562778473e-05, 8.130352944135666e-05, 8.518621325492859e-05, 8.906889706850052e-05, 9.295158088207245e-05, 9.683426469564438e-05, 0.00010071694850921631, 0.00010459963232278824, 0.00010848231613636017, 0.0001123649999499321, 0.00011624768376350403, 0.00012013036757707596, 0.0001240130513906479, 0.00012789573520421982, 0.00013177841901779175, 0.00013566110283136368, 0.0001395437866449356, 0.00014342647045850754, 0.00014730915427207947, 0.0001511918380856514, 0.00015507452189922333, 0.00015895720571279526, 0.0001628398895263672]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 6.0, 5.0, 5.0, 6.0, 9.0, 13.0, 25.0, 29.0, 44.0, 66.0, 98.0, 190.0, 318.0, 732.0, 3193.0, 31776.0, 939788.0, 65757.0, 4624.0, 955.0, 335.0, 201.0, 117.0, 78.0, 54.0, 35.0, 30.0, 19.0, 21.0, 11.0, 5.0, 7.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033782958984375, -0.03274679183959961, -0.03171062469482422, -0.030674457550048828, -0.029638290405273438, -0.028602123260498047, -0.027565956115722656, -0.026529788970947266, -0.025493621826171875, -0.024457454681396484, -0.023421287536621094, -0.022385120391845703, -0.021348953247070312, -0.020312786102294922, -0.01927661895751953, -0.01824045181274414, -0.01720428466796875, -0.01616811752319336, -0.015131950378417969, -0.014095783233642578, -0.013059616088867188, -0.012023448944091797, -0.010987281799316406, -0.009951114654541016, -0.008914947509765625, -0.007878780364990234, -0.006842613220214844, -0.005806446075439453, -0.0047702789306640625, -0.003734111785888672, -0.0026979446411132812, -0.0016617774963378906, -0.0006256103515625, 0.0004105567932128906, 0.0014467239379882812, 0.002482891082763672, 0.0035190582275390625, 0.004555225372314453, 0.005591392517089844, 0.006627559661865234, 0.007663726806640625, 0.008699893951416016, 0.009736061096191406, 0.010772228240966797, 0.011808395385742188, 0.012844562530517578, 0.013880729675292969, 0.01491689682006836, 0.01595306396484375, 0.01698923110961914, 0.01802539825439453, 0.019061565399169922, 0.020097732543945312, 0.021133899688720703, 0.022170066833496094, 0.023206233978271484, 0.024242401123046875, 0.025278568267822266, 0.026314735412597656, 0.027350902557373047, 0.028387069702148438, 0.029423236846923828, 0.03045940399169922, 0.03149557113647461, 0.03253173828125]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 4.0, 2.0, 4.0, 6.0, 7.0, 9.0, 13.0, 8.0, 13.0, 9.0, 19.0, 35.0, 43.0, 45.0, 76.0, 94.0, 120.0, 141.0, 90.0, 66.0, 32.0, 31.0, 28.0, 16.0, 12.0, 11.0, 12.0, 11.0, 11.0, 5.0, 5.0, 3.0, 5.0, 3.0, 3.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00778961181640625, -0.007553398609161377, -0.007317185401916504, -0.007080972194671631, -0.006844758987426758, -0.006608545780181885, -0.006372332572937012, -0.006136119365692139, -0.005899906158447266, -0.005663692951202393, -0.0054274797439575195, -0.0051912665367126465, -0.0049550533294677734, -0.0047188401222229, -0.004482626914978027, -0.004246413707733154, -0.004010200500488281, -0.003773987293243408, -0.003537774085998535, -0.003301560878753662, -0.003065347671508789, -0.002829134464263916, -0.002592921257019043, -0.00235670804977417, -0.002120494842529297, -0.0018842816352844238, -0.0016480684280395508, -0.0014118552207946777, -0.0011756420135498047, -0.0009394288063049316, -0.0007032155990600586, -0.00046700239181518555, -0.0002307891845703125, 5.424022674560547e-06, 0.0002416372299194336, 0.00047785043716430664, 0.0007140636444091797, 0.0009502768516540527, 0.0011864900588989258, 0.0014227032661437988, 0.0016589164733886719, 0.001895129680633545, 0.002131342887878418, 0.002367556095123291, 0.002603769302368164, 0.002839982509613037, 0.00307619571685791, 0.003312408924102783, 0.0035486221313476562, 0.0037848353385925293, 0.004021048545837402, 0.004257261753082275, 0.0044934749603271484, 0.0047296881675720215, 0.0049659013748168945, 0.005202114582061768, 0.005438327789306641, 0.005674540996551514, 0.005910754203796387, 0.00614696741104126, 0.006383180618286133, 0.006619393825531006, 0.006855607032775879, 0.007091820240020752, 0.007328033447265625]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 14.0, 167.0, 739.0, 80.0, 11.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8121696710586548, -0.7974826693534851, -0.7827956676483154, -0.768108606338501, -0.7534216046333313, -0.7387346029281616, -0.7240476012229919, -0.7093605995178223, -0.6946735382080078, -0.6799865365028381, -0.6652995347976685, -0.650612473487854, -0.6359254717826843, -0.6212384700775146, -0.606551468372345, -0.5918644666671753, -0.5771774649620056, -0.5624904632568359, -0.5478034615516663, -0.5331164002418518, -0.5184293985366821, -0.5037423968315125, -0.4890553951263428, -0.4743683934211731, -0.45968136191368103, -0.44499436020851135, -0.4303073287010193, -0.4156203269958496, -0.40093332529067993, -0.38624629378318787, -0.3715592920780182, -0.3568722605705261, -0.34218522906303406, -0.3274982273578644, -0.3128111958503723, -0.29812419414520264, -0.28343719244003296, -0.2687501609325409, -0.2540631592273712, -0.23937614262104034, -0.22468912601470947, -0.2100021094083786, -0.19531509280204773, -0.18062809109687805, -0.16594107449054718, -0.1512540578842163, -0.13656705617904663, -0.12188003957271576, -0.10719302296638489, -0.09250600636005402, -0.07781899720430374, -0.06313198804855347, -0.048444971442222595, -0.033757954835891724, -0.01907094568014145, -0.004383936524391174, 0.010303080081939697, 0.02499009296298027, 0.039677105844020844, 0.05436411872506142, 0.06905113160610199, 0.08373814821243286, 0.09842515736818314, 0.11311216652393341, 0.12779918313026428]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 9.0, 20.0, 17.0, 27.0, 29.0, 43.0, 43.0, 63.0, 62.0, 63.0, 53.0, 56.0, 73.0, 58.0, 63.0, 58.0, 46.0, 39.0, 42.0, 27.0, 22.0, 24.0, 22.0, 12.0, 7.0, 4.0, 5.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07898873090744019, -0.07669372111558914, -0.0743987038731575, -0.07210369408130646, -0.06980867683887482, -0.06751366704702377, -0.06521865725517273, -0.06292364001274109, -0.060628630220890045, -0.0583336167037487, -0.05603860318660736, -0.05374359339475632, -0.051448579877614975, -0.04915356636047363, -0.04685855656862259, -0.04456354305148125, -0.042268529534339905, -0.03997351601719856, -0.03767850250005722, -0.03538349270820618, -0.033088479191064835, -0.030793465673923492, -0.0284984540194273, -0.026203442364931107, -0.023908428847789764, -0.021613415330648422, -0.01931840367615223, -0.017023392021656036, -0.014728378504514694, -0.012433365918695927, -0.010138353332877159, -0.007843341678380966, -0.005548328161239624, -0.0032533155754208565, -0.0009583029896020889, 0.0013367095962166786, 0.003631722182035446, 0.005926734767854214, 0.008221747353672981, 0.010516759008169174, 0.012811772525310516, 0.015106785111129284, 0.01740179769694805, 0.019696809351444244, 0.021991822868585587, 0.02428683638572693, 0.02658184804022312, 0.028876859694719315, 0.031171873211860657, 0.033466886729002, 0.03576190024614334, 0.038056910037994385, 0.04035192355513573, 0.04264693707227707, 0.04494194686412811, 0.047236960381269455, 0.0495319738984108, 0.05182698741555214, 0.05412200093269348, 0.056417010724544525, 0.05871202424168587, 0.06100703775882721, 0.06330204755067825, 0.0655970573425293, 0.06789207458496094]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 3.0, 6.0, 17.0, 36.0, 63.0, 187.0, 420.0, 1333.0, 5774.0, 836596.0, 3342253.0, 5120.0, 1349.0, 563.0, 272.0, 123.0, 72.0, 36.0, 17.0, 16.0, 6.0, 8.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05438232421875, -0.052211761474609375, -0.05004119873046875, -0.047870635986328125, -0.0457000732421875, -0.043529510498046875, -0.04135894775390625, -0.039188385009765625, -0.037017822265625, -0.034847259521484375, -0.03267669677734375, -0.030506134033203125, -0.0283355712890625, -0.026165008544921875, -0.02399444580078125, -0.021823883056640625, -0.0196533203125, -0.017482757568359375, -0.01531219482421875, -0.013141632080078125, -0.0109710693359375, -0.008800506591796875, -0.00662994384765625, -0.004459381103515625, -0.002288818359375, -0.000118255615234375, 0.00205230712890625, 0.004222869873046875, 0.0063934326171875, 0.008563995361328125, 0.01073455810546875, 0.012905120849609375, 0.01507568359375, 0.017246246337890625, 0.01941680908203125, 0.021587371826171875, 0.0237579345703125, 0.025928497314453125, 0.02809906005859375, 0.030269622802734375, 0.032440185546875, 0.034610748291015625, 0.03678131103515625, 0.038951873779296875, 0.0411224365234375, 0.043292999267578125, 0.04546356201171875, 0.047634124755859375, 0.0498046875, 0.051975250244140625, 0.05414581298828125, 0.056316375732421875, 0.0584869384765625, 0.060657501220703125, 0.06282806396484375, 0.06499862670898438, 0.067169189453125, 0.06933975219726562, 0.07151031494140625, 0.07368087768554688, 0.0758514404296875, 0.07802200317382812, 0.08019256591796875, 0.08236312866210938, 0.08453369140625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 10.0, 15.0, 38.0, 102.0, 178.0, 276.0, 203.0, 105.0, 40.0, 17.0, 10.0, 8.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.014312744140625, -0.01377415657043457, -0.01323556900024414, -0.012696981430053711, -0.012158393859863281, -0.011619806289672852, -0.011081218719482422, -0.010542631149291992, -0.010004043579101562, -0.009465456008911133, -0.008926868438720703, -0.008388280868530273, -0.007849693298339844, -0.007311105728149414, -0.006772518157958984, -0.006233930587768555, -0.005695343017578125, -0.005156755447387695, -0.004618167877197266, -0.004079580307006836, -0.0035409927368164062, -0.0030024051666259766, -0.002463817596435547, -0.0019252300262451172, -0.0013866424560546875, -0.0008480548858642578, -0.0003094673156738281, 0.00022912025451660156, 0.0007677078247070312, 0.001306295394897461, 0.0018448829650878906, 0.0023834705352783203, 0.00292205810546875, 0.0034606456756591797, 0.003999233245849609, 0.004537820816040039, 0.005076408386230469, 0.0056149959564208984, 0.006153583526611328, 0.006692171096801758, 0.0072307586669921875, 0.007769346237182617, 0.008307933807373047, 0.008846521377563477, 0.009385108947753906, 0.009923696517944336, 0.010462284088134766, 0.011000871658325195, 0.011539459228515625, 0.012078046798706055, 0.012616634368896484, 0.013155221939086914, 0.013693809509277344, 0.014232397079467773, 0.014770984649658203, 0.015309572219848633, 0.015848159790039062, 0.016386747360229492, 0.016925334930419922, 0.01746392250061035, 0.01800251007080078, 0.01854109764099121, 0.01907968521118164, 0.01961827278137207, 0.0201568603515625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 1.0, 5.0, 11.0, 11.0, 13.0, 18.0, 30.0, 39.0, 73.0, 102.0, 173.0, 357.0, 578.0, 1280.0, 3354.0, 14962.0, 273142.0, 3718948.0, 163896.0, 11783.0, 3008.0, 1184.0, 550.0, 312.0, 152.0, 97.0, 68.0, 50.0, 18.0, 21.0, 14.0, 13.0, 7.0, 7.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.032989501953125, -0.0320584774017334, -0.031127452850341797, -0.030196428298950195, -0.029265403747558594, -0.028334379196166992, -0.02740335464477539, -0.02647233009338379, -0.025541305541992188, -0.024610280990600586, -0.023679256439208984, -0.022748231887817383, -0.02181720733642578, -0.02088618278503418, -0.019955158233642578, -0.019024133682250977, -0.018093109130859375, -0.017162084579467773, -0.016231060028076172, -0.01530003547668457, -0.014369010925292969, -0.013437986373901367, -0.012506961822509766, -0.011575937271118164, -0.010644912719726562, -0.009713888168334961, -0.00878286361694336, -0.007851839065551758, -0.006920814514160156, -0.005989789962768555, -0.005058765411376953, -0.0041277408599853516, -0.00319671630859375, -0.0022656917572021484, -0.0013346672058105469, -0.0004036426544189453, 0.0005273818969726562, 0.0014584064483642578, 0.0023894309997558594, 0.003320455551147461, 0.0042514801025390625, 0.005182504653930664, 0.006113529205322266, 0.007044553756713867, 0.007975578308105469, 0.00890660285949707, 0.009837627410888672, 0.010768651962280273, 0.011699676513671875, 0.012630701065063477, 0.013561725616455078, 0.01449275016784668, 0.015423774719238281, 0.016354799270629883, 0.017285823822021484, 0.018216848373413086, 0.019147872924804688, 0.02007889747619629, 0.02100992202758789, 0.021940946578979492, 0.022871971130371094, 0.023802995681762695, 0.024734020233154297, 0.0256650447845459, 0.0265960693359375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 10.0, 11.0, 17.0, 25.0, 25.0, 36.0, 72.0, 89.0, 145.0, 188.0, 285.0, 400.0, 578.0, 592.0, 508.0, 323.0, 253.0, 164.0, 111.0, 86.0, 55.0, 33.0, 21.0, 12.0, 9.0, 10.0, 10.0, 1.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01085662841796875, -0.010440707206726074, -0.010024785995483398, -0.009608864784240723, -0.009192943572998047, -0.008777022361755371, -0.008361101150512695, -0.00794517993927002, -0.007529258728027344, -0.007113337516784668, -0.006697416305541992, -0.006281495094299316, -0.005865573883056641, -0.005449652671813965, -0.005033731460571289, -0.004617810249328613, -0.0042018890380859375, -0.0037859678268432617, -0.003370046615600586, -0.00295412540435791, -0.0025382041931152344, -0.0021222829818725586, -0.0017063617706298828, -0.001290440559387207, -0.0008745193481445312, -0.00045859813690185547, -4.267692565917969e-05, 0.0003732442855834961, 0.0007891654968261719, 0.0012050867080688477, 0.0016210079193115234, 0.0020369291305541992, 0.002452850341796875, 0.0028687715530395508, 0.0032846927642822266, 0.0037006139755249023, 0.004116535186767578, 0.004532456398010254, 0.00494837760925293, 0.0053642988204956055, 0.005780220031738281, 0.006196141242980957, 0.006612062454223633, 0.007027983665466309, 0.007443904876708984, 0.00785982608795166, 0.008275747299194336, 0.008691668510437012, 0.009107589721679688, 0.009523510932922363, 0.009939432144165039, 0.010355353355407715, 0.01077127456665039, 0.011187195777893066, 0.011603116989135742, 0.012019038200378418, 0.012434959411621094, 0.01285088062286377, 0.013266801834106445, 0.013682723045349121, 0.014098644256591797, 0.014514565467834473, 0.014930486679077148, 0.015346407890319824, 0.0157623291015625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 13.0, 71.0, 535.0, 329.0, 45.0, 10.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3723847568035126, -0.3638807535171509, -0.3553767800331116, -0.3468727767467499, -0.3383687734603882, -0.3298647999763489, -0.3213607966899872, -0.3128568232059479, -0.3043528199195862, -0.2958488166332245, -0.2873448431491852, -0.2788408398628235, -0.2703368663787842, -0.2618328630924225, -0.2533288598060608, -0.2448248714208603, -0.2363208830356598, -0.2278168946504593, -0.2193129062652588, -0.2108089029788971, -0.2023049145936966, -0.1938009262084961, -0.1852969229221344, -0.1767929345369339, -0.1682889461517334, -0.1597849577665329, -0.1512809693813324, -0.1427769660949707, -0.1342729777097702, -0.1257689893245697, -0.1172649934887886, -0.10876099765300751, -0.100257009267807, -0.0917530208826065, -0.08324902504682541, -0.07474502921104431, -0.06624104082584381, -0.05773704871535301, -0.04923305660486221, -0.040729064494371414, -0.032225072383880615, -0.023721080273389816, -0.015217088162899017, -0.006713096052408218, 0.0017908960580825806, 0.01029488816857338, 0.01879888027906418, 0.027302872389554977, 0.035806864500045776, 0.044310856610536575, 0.052814848721027374, 0.06131884083151817, 0.06982283294200897, 0.07832682132720947, 0.08683081716299057, 0.09533481299877167, 0.10383880138397217, 0.11234278976917267, 0.12084678560495377, 0.12935078144073486, 0.13785476982593536, 0.14635875821113586, 0.15486276149749756, 0.16336674988269806, 0.17187073826789856]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 6.0, 3.0, 5.0, 5.0, 9.0, 10.0, 12.0, 13.0, 10.0, 11.0, 34.0, 32.0, 34.0, 32.0, 41.0, 42.0, 46.0, 50.0, 48.0, 55.0, 66.0, 67.0, 39.0, 52.0, 42.0, 47.0, 25.0, 46.0, 31.0, 31.0, 12.0, 17.0, 13.0, 7.0, 6.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.06207382678985596, -0.06053691357374191, -0.05900000035762787, -0.057463087141513824, -0.05592617392539978, -0.054389260709285736, -0.05285234749317169, -0.05131543427705765, -0.049778521060943604, -0.04824160784482956, -0.046704694628715515, -0.04516778141260147, -0.04363086819648743, -0.04209395498037338, -0.04055704176425934, -0.039020128548145294, -0.03748321533203125, -0.035946302115917206, -0.03440938889980316, -0.03287247568368912, -0.03133556246757507, -0.02979864925146103, -0.028261736035346985, -0.02672482281923294, -0.025187909603118896, -0.023650996387004852, -0.022114083170890808, -0.020577169954776764, -0.01904025673866272, -0.017503343522548676, -0.01596643030643463, -0.014429517090320587, -0.012892603874206543, -0.011355690658092499, -0.009818777441978455, -0.00828186422586441, -0.006744951009750366, -0.005208037793636322, -0.003671124577522278, -0.0021342113614082336, -0.0005972981452941895, 0.0009396150708198547, 0.002476528286933899, 0.004013441503047943, 0.005550354719161987, 0.0070872679352760315, 0.008624181151390076, 0.01016109436750412, 0.011698007583618164, 0.013234920799732208, 0.014771834015846252, 0.016308747231960297, 0.01784566044807434, 0.019382573664188385, 0.02091948688030243, 0.022456400096416473, 0.023993313312530518, 0.025530226528644562, 0.027067139744758606, 0.02860405296087265, 0.030140966176986694, 0.03167787939310074, 0.03321479260921478, 0.03475170582532883, 0.03628861904144287]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 9.0, 5.0, 13.0, 24.0, 27.0, 42.0, 65.0, 69.0, 119.0, 142.0, 222.0, 364.0, 526.0, 1193.0, 6628.0, 277509.0, 745366.0, 12709.0, 1659.0, 645.0, 405.0, 240.0, 153.0, 109.0, 69.0, 69.0, 41.0, 24.0, 24.0, 18.0, 16.0, 10.0, 5.0, 11.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0806884765625, -0.07845449447631836, -0.07622051239013672, -0.07398653030395508, -0.07175254821777344, -0.0695185661315918, -0.06728458404541016, -0.06505060195922852, -0.06281661987304688, -0.060582637786865234, -0.058348655700683594, -0.05611467361450195, -0.05388069152832031, -0.05164670944213867, -0.04941272735595703, -0.04717874526977539, -0.04494476318359375, -0.04271078109741211, -0.04047679901123047, -0.03824281692504883, -0.03600883483886719, -0.03377485275268555, -0.031540870666503906, -0.029306888580322266, -0.027072906494140625, -0.024838924407958984, -0.022604942321777344, -0.020370960235595703, -0.018136978149414062, -0.015902996063232422, -0.013669013977050781, -0.01143503189086914, -0.0092010498046875, -0.006967067718505859, -0.004733085632324219, -0.002499103546142578, -0.0002651214599609375, 0.001968860626220703, 0.004202842712402344, 0.006436824798583984, 0.008670806884765625, 0.010904788970947266, 0.013138771057128906, 0.015372753143310547, 0.017606735229492188, 0.019840717315673828, 0.02207469940185547, 0.02430868148803711, 0.02654266357421875, 0.02877664566040039, 0.03101062774658203, 0.03324460983276367, 0.03547859191894531, 0.03771257400512695, 0.039946556091308594, 0.042180538177490234, 0.044414520263671875, 0.046648502349853516, 0.048882484436035156, 0.0511164665222168, 0.05335044860839844, 0.05558443069458008, 0.05781841278076172, 0.06005239486694336, 0.062286376953125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 17.0, 37.0, 106.0, 186.0, 273.0, 208.0, 95.0, 47.0, 20.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01412200927734375, -0.013590693473815918, -0.013059377670288086, -0.012528061866760254, -0.011996746063232422, -0.01146543025970459, -0.010934114456176758, -0.010402798652648926, -0.009871482849121094, -0.009340167045593262, -0.00880885124206543, -0.008277535438537598, -0.007746219635009766, -0.007214903831481934, -0.0066835880279541016, -0.0061522722244262695, -0.0056209564208984375, -0.0050896406173706055, -0.0045583248138427734, -0.004027009010314941, -0.0034956932067871094, -0.0029643774032592773, -0.0024330615997314453, -0.0019017457962036133, -0.0013704299926757812, -0.0008391141891479492, -0.0003077983856201172, 0.00022351741790771484, 0.0007548332214355469, 0.001286149024963379, 0.001817464828491211, 0.002348780632019043, 0.002880096435546875, 0.003411412239074707, 0.003942728042602539, 0.004474043846130371, 0.005005359649658203, 0.005536675453186035, 0.006067991256713867, 0.006599307060241699, 0.007130622863769531, 0.007661938667297363, 0.008193254470825195, 0.008724570274353027, 0.00925588607788086, 0.009787201881408691, 0.010318517684936523, 0.010849833488464355, 0.011381149291992188, 0.01191246509552002, 0.012443780899047852, 0.012975096702575684, 0.013506412506103516, 0.014037728309631348, 0.01456904411315918, 0.015100359916687012, 0.015631675720214844, 0.016162991523742676, 0.016694307327270508, 0.01722562313079834, 0.017756938934326172, 0.018288254737854004, 0.018819570541381836, 0.019350886344909668, 0.0198822021484375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 6.0, 4.0, 4.0, 6.0, 11.0, 14.0, 27.0, 35.0, 53.0, 77.0, 94.0, 152.0, 199.0, 351.0, 664.0, 1375.0, 5066.0, 37235.0, 546443.0, 420638.0, 28758.0, 4332.0, 1325.0, 640.0, 364.0, 218.0, 140.0, 96.0, 52.0, 49.0, 31.0, 24.0, 12.0, 24.0, 16.0, 7.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.042144775390625, -0.040737152099609375, -0.03932952880859375, -0.037921905517578125, -0.0365142822265625, -0.035106658935546875, -0.03369903564453125, -0.032291412353515625, -0.0308837890625, -0.029476165771484375, -0.02806854248046875, -0.026660919189453125, -0.0252532958984375, -0.023845672607421875, -0.02243804931640625, -0.021030426025390625, -0.019622802734375, -0.018215179443359375, -0.01680755615234375, -0.015399932861328125, -0.0139923095703125, -0.012584686279296875, -0.01117706298828125, -0.009769439697265625, -0.00836181640625, -0.006954193115234375, -0.00554656982421875, -0.004138946533203125, -0.0027313232421875, -0.001323699951171875, 8.392333984375e-05, 0.001491546630859375, 0.002899169921875, 0.004306793212890625, 0.00571441650390625, 0.007122039794921875, 0.0085296630859375, 0.009937286376953125, 0.01134490966796875, 0.012752532958984375, 0.01416015625, 0.015567779541015625, 0.01697540283203125, 0.018383026123046875, 0.0197906494140625, 0.021198272705078125, 0.02260589599609375, 0.024013519287109375, 0.025421142578125, 0.026828765869140625, 0.02823638916015625, 0.029644012451171875, 0.0310516357421875, 0.032459259033203125, 0.03386688232421875, 0.035274505615234375, 0.03668212890625, 0.038089752197265625, 0.03949737548828125, 0.040904998779296875, 0.0423126220703125, 0.043720245361328125, 0.04512786865234375, 0.046535491943359375, 0.047943115234375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 7.0, 5.0, 8.0, 6.0, 11.0, 8.0, 10.0, 11.0, 19.0, 26.0, 27.0, 36.0, 45.0, 31.0, 37.0, 39.0, 46.0, 51.0, 46.0, 37.0, 57.0, 54.0, 44.0, 35.0, 41.0, 31.0, 35.0, 26.0, 27.0, 29.0, 15.0, 17.0, 18.0, 14.0, 7.0, 7.0, 6.0, 10.0, 7.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.01513671875, -0.014740467071533203, -0.014344215393066406, -0.01394796371459961, -0.013551712036132812, -0.013155460357666016, -0.012759208679199219, -0.012362957000732422, -0.011966705322265625, -0.011570453643798828, -0.011174201965332031, -0.010777950286865234, -0.010381698608398438, -0.00998544692993164, -0.009589195251464844, -0.009192943572998047, -0.00879669189453125, -0.008400440216064453, -0.008004188537597656, -0.007607936859130859, -0.0072116851806640625, -0.006815433502197266, -0.006419181823730469, -0.006022930145263672, -0.005626678466796875, -0.005230426788330078, -0.004834175109863281, -0.004437923431396484, -0.0040416717529296875, -0.0036454200744628906, -0.0032491683959960938, -0.002852916717529297, -0.0024566650390625, -0.002060413360595703, -0.0016641616821289062, -0.0012679100036621094, -0.0008716583251953125, -0.0004754066467285156, -7.915496826171875e-05, 0.0003170967102050781, 0.000713348388671875, 0.0011096000671386719, 0.0015058517456054688, 0.0019021034240722656, 0.0022983551025390625, 0.0026946067810058594, 0.0030908584594726562, 0.003487110137939453, 0.00388336181640625, 0.004279613494873047, 0.004675865173339844, 0.005072116851806641, 0.0054683685302734375, 0.005864620208740234, 0.006260871887207031, 0.006657123565673828, 0.007053375244140625, 0.007449626922607422, 0.007845878601074219, 0.008242130279541016, 0.008638381958007812, 0.00903463363647461, 0.009430885314941406, 0.009827136993408203, 0.010223388671875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 5.0, 13.0, 11.0, 10.0, 26.0, 33.0, 59.0, 96.0, 242.0, 490.0, 1236.0, 3760.0, 16142.0, 260879.0, 730455.0, 26951.0, 5345.0, 1583.0, 642.0, 244.0, 155.0, 59.0, 32.0, 27.0, 18.0, 8.0, 6.0, 0.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.039337158203125, -0.03835701942443848, -0.03737688064575195, -0.03639674186706543, -0.035416603088378906, -0.03443646430969238, -0.03345632553100586, -0.032476186752319336, -0.03149604797363281, -0.03051590919494629, -0.029535770416259766, -0.028555631637573242, -0.02757549285888672, -0.026595354080200195, -0.025615215301513672, -0.02463507652282715, -0.023654937744140625, -0.0226747989654541, -0.021694660186767578, -0.020714521408081055, -0.01973438262939453, -0.018754243850708008, -0.017774105072021484, -0.01679396629333496, -0.015813827514648438, -0.014833688735961914, -0.01385354995727539, -0.012873411178588867, -0.011893272399902344, -0.01091313362121582, -0.009932994842529297, -0.008952856063842773, -0.00797271728515625, -0.0069925785064697266, -0.006012439727783203, -0.00503230094909668, -0.004052162170410156, -0.003072023391723633, -0.0020918846130371094, -0.001111745834350586, -0.0001316070556640625, 0.0008485317230224609, 0.0018286705017089844, 0.002808809280395508, 0.0037889480590820312, 0.004769086837768555, 0.005749225616455078, 0.0067293643951416016, 0.007709503173828125, 0.008689641952514648, 0.009669780731201172, 0.010649919509887695, 0.011630058288574219, 0.012610197067260742, 0.013590335845947266, 0.014570474624633789, 0.015550613403320312, 0.016530752182006836, 0.01751089096069336, 0.018491029739379883, 0.019471168518066406, 0.02045130729675293, 0.021431446075439453, 0.022411584854125977, 0.0233917236328125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 4.0, 6.0, 1.0, 7.0, 7.0, 7.0, 4.0, 11.0, 7.0, 16.0, 20.0, 18.0, 29.0, 28.0, 30.0, 45.0, 57.0, 46.0, 70.0, 80.0, 84.0, 57.0, 64.0, 42.0, 44.0, 36.0, 34.0, 34.0, 19.0, 15.0, 20.0, 15.0, 11.0, 5.0, 2.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-8.040666580200195e-05, -7.82972201704979e-05, -7.618777453899384e-05, -7.407832890748978e-05, -7.196888327598572e-05, -6.985943764448166e-05, -6.77499920129776e-05, -6.564054638147354e-05, -6.353110074996948e-05, -6.142165511846542e-05, -5.9312209486961365e-05, -5.7202763855457306e-05, -5.509331822395325e-05, -5.298387259244919e-05, -5.087442696094513e-05, -4.876498132944107e-05, -4.665553569793701e-05, -4.454609006643295e-05, -4.2436644434928894e-05, -4.0327198803424835e-05, -3.8217753171920776e-05, -3.610830754041672e-05, -3.399886190891266e-05, -3.18894162774086e-05, -2.977997064590454e-05, -2.7670525014400482e-05, -2.5561079382896423e-05, -2.3451633751392365e-05, -2.1342188119888306e-05, -1.9232742488384247e-05, -1.7123296856880188e-05, -1.5013851225376129e-05, -1.290440559387207e-05, -1.0794959962368011e-05, -8.685514330863953e-06, -6.576068699359894e-06, -4.466623067855835e-06, -2.357177436351776e-06, -2.477318048477173e-07, 1.8617138266563416e-06, 3.9711594581604e-06, 6.080605089664459e-06, 8.190050721168518e-06, 1.0299496352672577e-05, 1.2408941984176636e-05, 1.4518387615680695e-05, 1.6627833247184753e-05, 1.8737278878688812e-05, 2.084672451019287e-05, 2.295617014169693e-05, 2.506561577320099e-05, 2.7175061404705048e-05, 2.9284507036209106e-05, 3.1393952667713165e-05, 3.3503398299217224e-05, 3.561284393072128e-05, 3.772228956222534e-05, 3.98317351937294e-05, 4.194118082523346e-05, 4.405062645673752e-05, 4.616007208824158e-05, 4.8269517719745636e-05, 5.0378963351249695e-05, 5.2488408982753754e-05, 5.459785461425781e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 9.0, 6.0, 5.0, 9.0, 12.0, 10.0, 19.0, 18.0, 20.0, 21.0, 36.0, 61.0, 96.0, 143.0, 233.0, 474.0, 1418.0, 6795.0, 74150.0, 927509.0, 31772.0, 3879.0, 956.0, 355.0, 172.0, 106.0, 72.0, 53.0, 32.0, 27.0, 24.0, 15.0, 12.0, 5.0, 10.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034576416015625, -0.03354024887084961, -0.03250408172607422, -0.03146791458129883, -0.030431747436523438, -0.029395580291748047, -0.028359413146972656, -0.027323246002197266, -0.026287078857421875, -0.025250911712646484, -0.024214744567871094, -0.023178577423095703, -0.022142410278320312, -0.021106243133544922, -0.02007007598876953, -0.01903390884399414, -0.01799774169921875, -0.01696157455444336, -0.01592540740966797, -0.014889240264892578, -0.013853073120117188, -0.012816905975341797, -0.011780738830566406, -0.010744571685791016, -0.009708404541015625, -0.008672237396240234, -0.007636070251464844, -0.006599903106689453, -0.0055637359619140625, -0.004527568817138672, -0.0034914016723632812, -0.0024552345275878906, -0.0014190673828125, -0.0003829002380371094, 0.0006532669067382812, 0.0016894340515136719, 0.0027256011962890625, 0.003761768341064453, 0.004797935485839844, 0.005834102630615234, 0.006870269775390625, 0.007906436920166016, 0.008942604064941406, 0.009978771209716797, 0.011014938354492188, 0.012051105499267578, 0.013087272644042969, 0.01412343978881836, 0.01515960693359375, 0.01619577407836914, 0.01723194122314453, 0.018268108367919922, 0.019304275512695312, 0.020340442657470703, 0.021376609802246094, 0.022412776947021484, 0.023448944091796875, 0.024485111236572266, 0.025521278381347656, 0.026557445526123047, 0.027593612670898438, 0.028629779815673828, 0.02966594696044922, 0.03070211410522461, 0.03173828125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 8.0, 3.0, 7.0, 6.0, 7.0, 10.0, 12.0, 10.0, 26.0, 40.0, 69.0, 97.0, 128.0, 148.0, 125.0, 81.0, 52.0, 44.0, 20.0, 20.0, 12.0, 14.0, 10.0, 7.0, 5.0, 7.0, 4.0, 5.0, 3.0, 0.0, 6.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007503509521484375, -0.007229030132293701, -0.006954550743103027, -0.0066800713539123535, -0.00640559196472168, -0.006131112575531006, -0.005856633186340332, -0.005582153797149658, -0.005307674407958984, -0.0050331950187683105, -0.004758715629577637, -0.004484236240386963, -0.004209756851196289, -0.003935277462005615, -0.0036607980728149414, -0.0033863186836242676, -0.0031118392944335938, -0.00283735990524292, -0.002562880516052246, -0.0022884011268615723, -0.0020139217376708984, -0.0017394423484802246, -0.0014649629592895508, -0.001190483570098877, -0.0009160041809082031, -0.0006415247917175293, -0.00036704540252685547, -9.256601333618164e-05, 0.0001819133758544922, 0.000456392765045166, 0.0007308721542358398, 0.0010053515434265137, 0.0012798309326171875, 0.0015543103218078613, 0.0018287897109985352, 0.002103269100189209, 0.002377748489379883, 0.0026522278785705566, 0.0029267072677612305, 0.0032011866569519043, 0.003475666046142578, 0.003750145435333252, 0.004024624824523926, 0.0042991042137146, 0.0045735836029052734, 0.004848062992095947, 0.005122542381286621, 0.005397021770477295, 0.005671501159667969, 0.005945980548858643, 0.006220459938049316, 0.00649493932723999, 0.006769418716430664, 0.007043898105621338, 0.007318377494812012, 0.0075928568840026855, 0.00786733627319336, 0.008141815662384033, 0.008416295051574707, 0.00869077444076538, 0.008965253829956055, 0.009239733219146729, 0.009514212608337402, 0.009788691997528076, 0.01006317138671875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 13.0, 37.0, 97.0, 251.0, 250.0, 172.0, 95.0, 43.0, 18.0, 16.0, 4.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1545153558254242, -0.15064574778079987, -0.14677613973617554, -0.1429065465927124, -0.13903693854808807, -0.13516733050346375, -0.13129772245883942, -0.1274281144142151, -0.12355852127075195, -0.11968891322612762, -0.11581931263208389, -0.11194970458745956, -0.10808010399341583, -0.1042104959487915, -0.10034088790416718, -0.09647128731012344, -0.09260167926549911, -0.08873207122087479, -0.08486247062683105, -0.08099286258220673, -0.077123261988163, -0.07325365394353867, -0.06938405334949493, -0.0655144453048706, -0.061644840985536575, -0.057775236666202545, -0.053905632346868515, -0.050036028027534485, -0.046166419982910156, -0.042296819388866425, -0.038427211344242096, -0.034557607024908066, -0.030688010156154633, -0.026818405836820602, -0.022948801517486572, -0.019079195335507393, -0.015209591016173363, -0.011339986696839333, -0.007470380514860153, -0.003600776195526123, 0.0002688281238079071, 0.0041384329088032246, 0.008008037693798542, 0.011877642944455147, 0.015747247263789177, 0.019616851583123207, 0.023486457765102386, 0.027356062084436417, 0.031225666403770447, 0.03509527072310448, 0.03896487504243851, 0.042834483087062836, 0.04670408368110657, 0.050573691725730896, 0.054443296045064926, 0.058312900364398956, 0.062182504683732986, 0.06605210900306702, 0.06992171704769135, 0.07379131764173508, 0.0776609256863594, 0.08153052628040314, 0.08540013432502747, 0.0892697423696518, 0.09313934296369553]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 6.0, 4.0, 9.0, 15.0, 18.0, 27.0, 28.0, 40.0, 65.0, 57.0, 64.0, 92.0, 71.0, 70.0, 77.0, 61.0, 72.0, 57.0, 48.0, 36.0, 28.0, 16.0, 17.0, 7.0, 10.0, 7.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09033203125, -0.087941013276577, -0.08554999530315399, -0.08315898478031158, -0.08076796680688858, -0.07837694883346558, -0.07598593831062317, -0.07359492033720016, -0.07120390236377716, -0.06881288439035416, -0.06642186641693115, -0.06403085589408875, -0.06163983792066574, -0.05924881994724274, -0.05685780569911003, -0.054466791450977325, -0.05207577347755432, -0.04968475550413132, -0.04729374125599861, -0.044902727007865906, -0.0425117090344429, -0.0401206910610199, -0.03772967681288719, -0.035338662564754486, -0.03294764459133148, -0.030556628480553627, -0.028165612369775772, -0.025774596258997917, -0.023383580148220062, -0.020992564037442207, -0.018601547926664352, -0.016210531815886497, -0.013819515705108643, -0.011428499594330788, -0.009037483483552933, -0.006646467372775078, -0.004255451261997223, -0.001864435151219368, 0.0005265809595584869, 0.002917597070336342, 0.005308613181114197, 0.007699629291892052, 0.010090645402669907, 0.012481661513447762, 0.014872677624225616, 0.01726369373500347, 0.019654709845781326, 0.02204572595655918, 0.024436742067337036, 0.02682775817811489, 0.029218774288892746, 0.03160978853702545, 0.034000806510448456, 0.03639182448387146, 0.038782838732004166, 0.04117385298013687, 0.043564870953559875, 0.04595588892698288, 0.048346903175115585, 0.05073791742324829, 0.053128935396671295, 0.0555199533700943, 0.057910967618227005, 0.06030198186635971, 0.06269299983978271]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 4.0, 14.0, 7.0, 12.0, 21.0, 62.0, 74.0, 142.0, 271.0, 461.0, 993.0, 2541.0, 8302.0, 461607.0, 3698512.0, 16264.0, 2544.0, 975.0, 571.0, 330.0, 217.0, 129.0, 80.0, 51.0, 32.0, 19.0, 13.0, 10.0, 13.0, 7.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03741455078125, -0.03617429733276367, -0.034934043884277344, -0.033693790435791016, -0.03245353698730469, -0.03121328353881836, -0.02997303009033203, -0.028732776641845703, -0.027492523193359375, -0.026252269744873047, -0.02501201629638672, -0.02377176284790039, -0.022531509399414062, -0.021291255950927734, -0.020051002502441406, -0.018810749053955078, -0.01757049560546875, -0.016330242156982422, -0.015089988708496094, -0.013849735260009766, -0.012609481811523438, -0.01136922836303711, -0.010128974914550781, -0.008888721466064453, -0.007648468017578125, -0.006408214569091797, -0.005167961120605469, -0.003927707672119141, -0.0026874542236328125, -0.0014472007751464844, -0.00020694732666015625, 0.0010333061218261719, 0.0022735595703125, 0.003513813018798828, 0.004754066467285156, 0.005994319915771484, 0.0072345733642578125, 0.00847482681274414, 0.009715080261230469, 0.010955333709716797, 0.012195587158203125, 0.013435840606689453, 0.014676094055175781, 0.01591634750366211, 0.017156600952148438, 0.018396854400634766, 0.019637107849121094, 0.020877361297607422, 0.02211761474609375, 0.023357868194580078, 0.024598121643066406, 0.025838375091552734, 0.027078628540039062, 0.02831888198852539, 0.02955913543701172, 0.030799388885498047, 0.032039642333984375, 0.0332798957824707, 0.03452014923095703, 0.03576040267944336, 0.03700065612792969, 0.038240909576416016, 0.039481163024902344, 0.04072141647338867, 0.041961669921875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 5.0, 4.0, 13.0, 44.0, 105.0, 196.0, 247.0, 207.0, 111.0, 40.0, 23.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01549530029296875, -0.01495349407196045, -0.014411687850952148, -0.013869881629943848, -0.013328075408935547, -0.012786269187927246, -0.012244462966918945, -0.011702656745910645, -0.011160850524902344, -0.010619044303894043, -0.010077238082885742, -0.009535431861877441, -0.00899362564086914, -0.00845181941986084, -0.007910013198852539, -0.007368206977844238, -0.0068264007568359375, -0.006284594535827637, -0.005742788314819336, -0.005200982093811035, -0.004659175872802734, -0.004117369651794434, -0.003575563430786133, -0.003033757209777832, -0.0024919509887695312, -0.0019501447677612305, -0.0014083385467529297, -0.0008665323257446289, -0.0003247261047363281, 0.00021708011627197266, 0.0007588863372802734, 0.0013006925582885742, 0.001842498779296875, 0.0023843050003051758, 0.0029261112213134766, 0.0034679174423217773, 0.004009723663330078, 0.004551529884338379, 0.00509333610534668, 0.0056351423263549805, 0.006176948547363281, 0.006718754768371582, 0.007260560989379883, 0.007802367210388184, 0.008344173431396484, 0.008885979652404785, 0.009427785873413086, 0.009969592094421387, 0.010511398315429688, 0.011053204536437988, 0.011595010757446289, 0.01213681697845459, 0.01267862319946289, 0.013220429420471191, 0.013762235641479492, 0.014304041862487793, 0.014845848083496094, 0.015387654304504395, 0.015929460525512695, 0.016471266746520996, 0.017013072967529297, 0.017554879188537598, 0.0180966854095459, 0.0186384916305542, 0.0191802978515625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 7.0, 23.0, 20.0, 23.0, 37.0, 82.0, 137.0, 234.0, 470.0, 1080.0, 2765.0, 11995.0, 230289.0, 3790630.0, 142427.0, 9636.0, 2359.0, 919.0, 484.0, 244.0, 131.0, 82.0, 63.0, 48.0, 33.0, 24.0, 9.0, 10.0, 7.0, 0.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02899169921875, -0.028007030487060547, -0.027022361755371094, -0.02603769302368164, -0.025053024291992188, -0.024068355560302734, -0.02308368682861328, -0.022099018096923828, -0.021114349365234375, -0.020129680633544922, -0.01914501190185547, -0.018160343170166016, -0.017175674438476562, -0.01619100570678711, -0.015206336975097656, -0.014221668243408203, -0.01323699951171875, -0.012252330780029297, -0.011267662048339844, -0.01028299331665039, -0.009298324584960938, -0.008313655853271484, -0.007328987121582031, -0.006344318389892578, -0.005359649658203125, -0.004374980926513672, -0.0033903121948242188, -0.0024056434631347656, -0.0014209747314453125, -0.0004363059997558594, 0.0005483627319335938, 0.0015330314636230469, 0.0025177001953125, 0.003502368927001953, 0.004487037658691406, 0.005471706390380859, 0.0064563751220703125, 0.007441043853759766, 0.008425712585449219, 0.009410381317138672, 0.010395050048828125, 0.011379718780517578, 0.012364387512207031, 0.013349056243896484, 0.014333724975585938, 0.01531839370727539, 0.016303062438964844, 0.017287731170654297, 0.01827239990234375, 0.019257068634033203, 0.020241737365722656, 0.02122640609741211, 0.022211074829101562, 0.023195743560791016, 0.02418041229248047, 0.025165081024169922, 0.026149749755859375, 0.027134418487548828, 0.02811908721923828, 0.029103755950927734, 0.030088424682617188, 0.03107309341430664, 0.032057762145996094, 0.03304243087768555, 0.034027099609375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 3.0, 12.0, 14.0, 24.0, 30.0, 35.0, 57.0, 81.0, 127.0, 176.0, 214.0, 288.0, 396.0, 441.0, 550.0, 385.0, 347.0, 313.0, 204.0, 108.0, 89.0, 62.0, 45.0, 21.0, 19.0, 12.0, 6.0, 9.0, 2.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0149688720703125, -0.014580845832824707, -0.014192819595336914, -0.013804793357849121, -0.013416767120361328, -0.013028740882873535, -0.012640714645385742, -0.01225268840789795, -0.011864662170410156, -0.011476635932922363, -0.01108860969543457, -0.010700583457946777, -0.010312557220458984, -0.009924530982971191, -0.009536504745483398, -0.009148478507995605, -0.008760452270507812, -0.00837242603302002, -0.007984399795532227, -0.007596373558044434, -0.007208347320556641, -0.006820321083068848, -0.006432294845581055, -0.006044268608093262, -0.005656242370605469, -0.005268216133117676, -0.004880189895629883, -0.00449216365814209, -0.004104137420654297, -0.003716111183166504, -0.003328084945678711, -0.002940058708190918, -0.002552032470703125, -0.002164006233215332, -0.001775979995727539, -0.001387953758239746, -0.0009999275207519531, -0.0006119012832641602, -0.0002238750457763672, 0.00016415119171142578, 0.0005521774291992188, 0.0009402036666870117, 0.0013282299041748047, 0.0017162561416625977, 0.0021042823791503906, 0.0024923086166381836, 0.0028803348541259766, 0.0032683610916137695, 0.0036563873291015625, 0.0040444135665893555, 0.0044324398040771484, 0.004820466041564941, 0.005208492279052734, 0.005596518516540527, 0.00598454475402832, 0.006372570991516113, 0.006760597229003906, 0.007148623466491699, 0.007536649703979492, 0.007924675941467285, 0.008312702178955078, 0.008700728416442871, 0.009088754653930664, 0.009476780891418457, 0.00986480712890625]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 9.0, 38.0, 218.0, 505.0, 203.0, 28.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18809863924980164, -0.1812610775232315, -0.17442351579666138, -0.16758596897125244, -0.1607484072446823, -0.15391084551811218, -0.14707328379154205, -0.14023572206497192, -0.1333981603384018, -0.12656059861183167, -0.11972304433584213, -0.112885482609272, -0.10604792088270187, -0.09921036660671234, -0.09237280488014221, -0.08553524315357208, -0.07869768887758255, -0.07186012715101242, -0.06502257287502289, -0.05818501114845276, -0.05134744942188263, -0.0445098914206028, -0.03767233341932297, -0.030834771692752838, -0.023997213691473007, -0.017159653827548027, -0.010322094894945621, -0.003484535962343216, 0.0033530239015817642, 0.010190583765506744, 0.017028141766786575, 0.023865703493356705, 0.030703261494636536, 0.03754081949591637, 0.044378381222486496, 0.05121593922376633, 0.058053500950336456, 0.06489105522632599, 0.07172861695289612, 0.07856617867946625, 0.08540374040603638, 0.0922413021326065, 0.09907885640859604, 0.10591641813516617, 0.1127539798617363, 0.11959153413772583, 0.12642909586429596, 0.1332666575908661, 0.14010420441627502, 0.14694176614284515, 0.15377932786941528, 0.16061687469482422, 0.16745443642139435, 0.17429199814796448, 0.1811295598745346, 0.18796712160110474, 0.19480468332767487, 0.201642245054245, 0.20847980678081512, 0.21531736850738525, 0.2221549153327942, 0.22899247705936432, 0.23583003878593445, 0.24266760051250458, 0.2495051622390747]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 7.0, 22.0, 26.0, 31.0, 51.0, 54.0, 67.0, 87.0, 87.0, 66.0, 70.0, 72.0, 72.0, 82.0, 48.0, 49.0, 33.0, 23.0, 17.0, 14.0, 6.0, 2.0, 3.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07989686727523804, -0.07736919075250626, -0.07484152168035507, -0.07231384515762329, -0.0697861760854721, -0.06725849956274033, -0.06473082304000854, -0.06220315024256706, -0.05967547744512558, -0.0571478046476841, -0.054620131850242615, -0.052092455327510834, -0.04956478253006935, -0.04703710973262787, -0.04450943320989609, -0.041981760412454605, -0.03945408761501312, -0.03692641481757164, -0.03439874202013016, -0.031871065497398376, -0.029343392699956894, -0.02681571990251541, -0.02428804524242878, -0.021760370582342148, -0.019232697784900665, -0.016705024987459183, -0.014177350327372551, -0.011649676598608494, -0.009122002869844437, -0.0065943291410803795, -0.004066655412316322, -0.0015389807522296906, 0.000988692045211792, 0.003516365773975849, 0.006044039502739906, 0.008571713231503963, 0.01109938696026802, 0.013627060689032078, 0.016154734417796135, 0.018682409077882767, 0.02121008187532425, 0.023737754672765732, 0.026265429332852364, 0.028793103992938995, 0.03132077679038048, 0.03384844958782196, 0.03637612611055374, 0.038903798907995224, 0.04143147170543671, 0.04395914450287819, 0.04648681730031967, 0.04901449382305145, 0.051542166620492935, 0.05406983941793442, 0.0565975159406662, 0.05912518873810768, 0.061652861535549164, 0.06418053805828094, 0.06670820713043213, 0.06923588365316391, 0.07176356017589569, 0.07429122924804688, 0.07681890577077866, 0.07934658229351044, 0.08187425136566162]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 5.0, 7.0, 2.0, 14.0, 6.0, 8.0, 8.0, 15.0, 19.0, 21.0, 35.0, 44.0, 54.0, 73.0, 98.0, 115.0, 145.0, 233.0, 290.0, 419.0, 634.0, 1153.0, 4126.0, 42407.0, 811131.0, 173731.0, 9189.0, 1941.0, 851.0, 451.0, 363.0, 230.0, 170.0, 122.0, 101.0, 80.0, 60.0, 47.0, 35.0, 36.0, 21.0, 11.0, 18.0, 11.0, 9.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.05047607421875, -0.04902172088623047, -0.04756736755371094, -0.046113014221191406, -0.044658660888671875, -0.043204307556152344, -0.04174995422363281, -0.04029560089111328, -0.03884124755859375, -0.03738689422607422, -0.03593254089355469, -0.034478187561035156, -0.033023834228515625, -0.031569480895996094, -0.030115127563476562, -0.02866077423095703, -0.0272064208984375, -0.02575206756591797, -0.024297714233398438, -0.022843360900878906, -0.021389007568359375, -0.019934654235839844, -0.018480300903320312, -0.01702594757080078, -0.01557159423828125, -0.014117240905761719, -0.012662887573242188, -0.011208534240722656, -0.009754180908203125, -0.008299827575683594, -0.0068454742431640625, -0.005391120910644531, -0.003936767578125, -0.0024824142456054688, -0.0010280609130859375, 0.00042629241943359375, 0.001880645751953125, 0.0033349990844726562, 0.0047893524169921875, 0.006243705749511719, 0.00769805908203125, 0.009152412414550781, 0.010606765747070312, 0.012061119079589844, 0.013515472412109375, 0.014969825744628906, 0.016424179077148438, 0.01787853240966797, 0.0193328857421875, 0.02078723907470703, 0.022241592407226562, 0.023695945739746094, 0.025150299072265625, 0.026604652404785156, 0.028059005737304688, 0.02951335906982422, 0.03096771240234375, 0.03242206573486328, 0.03387641906738281, 0.035330772399902344, 0.036785125732421875, 0.038239479064941406, 0.03969383239746094, 0.04114818572998047, 0.0426025390625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 16.0, 44.0, 108.0, 188.0, 251.0, 191.0, 133.0, 46.0, 16.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.01554107666015625, -0.014997124671936035, -0.01445317268371582, -0.013909220695495605, -0.01336526870727539, -0.012821316719055176, -0.012277364730834961, -0.011733412742614746, -0.011189460754394531, -0.010645508766174316, -0.010101556777954102, -0.009557604789733887, -0.009013652801513672, -0.008469700813293457, -0.007925748825073242, -0.007381796836853027, -0.0068378448486328125, -0.006293892860412598, -0.005749940872192383, -0.005205988883972168, -0.004662036895751953, -0.004118084907531738, -0.0035741329193115234, -0.0030301809310913086, -0.0024862289428710938, -0.001942276954650879, -0.001398324966430664, -0.0008543729782104492, -0.0003104209899902344, 0.00023353099822998047, 0.0007774829864501953, 0.0013214349746704102, 0.001865386962890625, 0.00240933895111084, 0.0029532909393310547, 0.0034972429275512695, 0.004041194915771484, 0.004585146903991699, 0.005129098892211914, 0.005673050880432129, 0.006217002868652344, 0.006760954856872559, 0.0073049068450927734, 0.007848858833312988, 0.008392810821533203, 0.008936762809753418, 0.009480714797973633, 0.010024666786193848, 0.010568618774414062, 0.011112570762634277, 0.011656522750854492, 0.012200474739074707, 0.012744426727294922, 0.013288378715515137, 0.013832330703735352, 0.014376282691955566, 0.014920234680175781, 0.015464186668395996, 0.01600813865661621, 0.016552090644836426, 0.01709604263305664, 0.017639994621276855, 0.01818394660949707, 0.018727898597717285, 0.0192718505859375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 1.0, 5.0, 7.0, 8.0, 11.0, 14.0, 28.0, 25.0, 38.0, 40.0, 87.0, 139.0, 236.0, 430.0, 786.0, 1911.0, 8974.0, 218744.0, 780884.0, 30422.0, 3298.0, 1147.0, 522.0, 292.0, 162.0, 107.0, 76.0, 43.0, 41.0, 18.0, 21.0, 8.0, 10.0, 5.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044525146484375, -0.04294776916503906, -0.041370391845703125, -0.03979301452636719, -0.03821563720703125, -0.03663825988769531, -0.035060882568359375, -0.03348350524902344, -0.0319061279296875, -0.030328750610351562, -0.028751373291015625, -0.027173995971679688, -0.02559661865234375, -0.024019241333007812, -0.022441864013671875, -0.020864486694335938, -0.019287109375, -0.017709732055664062, -0.016132354736328125, -0.014554977416992188, -0.01297760009765625, -0.011400222778320312, -0.009822845458984375, -0.008245468139648438, -0.0066680908203125, -0.0050907135009765625, -0.003513336181640625, -0.0019359588623046875, -0.00035858154296875, 0.0012187957763671875, 0.002796173095703125, 0.0043735504150390625, 0.005950927734375, 0.0075283050537109375, 0.009105682373046875, 0.010683059692382812, 0.01226043701171875, 0.013837814331054688, 0.015415191650390625, 0.016992568969726562, 0.0185699462890625, 0.020147323608398438, 0.021724700927734375, 0.023302078247070312, 0.02487945556640625, 0.026456832885742188, 0.028034210205078125, 0.029611587524414062, 0.03118896484375, 0.03276634216308594, 0.034343719482421875, 0.03592109680175781, 0.03749847412109375, 0.03907585144042969, 0.040653228759765625, 0.04223060607910156, 0.0438079833984375, 0.04538536071777344, 0.046962738037109375, 0.04854011535644531, 0.05011749267578125, 0.05169486999511719, 0.053272247314453125, 0.05484962463378906, 0.056427001953125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 0.0, 0.0, 4.0, 2.0, 3.0, 9.0, 4.0, 15.0, 11.0, 22.0, 20.0, 21.0, 25.0, 28.0, 30.0, 26.0, 37.0, 40.0, 27.0, 35.0, 43.0, 46.0, 40.0, 48.0, 29.0, 32.0, 31.0, 36.0, 44.0, 38.0, 33.0, 36.0, 35.0, 23.0, 15.0, 18.0, 12.0, 16.0, 9.0, 13.0, 10.0, 8.0, 7.0, 4.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01213836669921875, -0.011754989624023438, -0.011371612548828125, -0.010988235473632812, -0.0106048583984375, -0.010221481323242188, -0.009838104248046875, -0.009454727172851562, -0.00907135009765625, -0.008687973022460938, -0.008304595947265625, -0.007921218872070312, -0.007537841796875, -0.0071544647216796875, -0.006771087646484375, -0.0063877105712890625, -0.00600433349609375, -0.0056209564208984375, -0.005237579345703125, -0.0048542022705078125, -0.0044708251953125, -0.0040874481201171875, -0.003704071044921875, -0.0033206939697265625, -0.00293731689453125, -0.0025539398193359375, -0.002170562744140625, -0.0017871856689453125, -0.00140380859375, -0.0010204315185546875, -0.000637054443359375, -0.0002536773681640625, 0.00012969970703125, 0.0005130767822265625, 0.000896453857421875, 0.0012798309326171875, 0.0016632080078125, 0.0020465850830078125, 0.002429962158203125, 0.0028133392333984375, 0.00319671630859375, 0.0035800933837890625, 0.003963470458984375, 0.0043468475341796875, 0.004730224609375, 0.0051136016845703125, 0.005496978759765625, 0.0058803558349609375, 0.00626373291015625, 0.0066471099853515625, 0.007030487060546875, 0.0074138641357421875, 0.0077972412109375, 0.008180618286132812, 0.008563995361328125, 0.008947372436523438, 0.00933074951171875, 0.009714126586914062, 0.010097503662109375, 0.010480880737304688, 0.0108642578125, 0.011247634887695312, 0.011631011962890625, 0.012014389038085938, 0.01239776611328125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 2.0, 2.0, 6.0, 6.0, 12.0, 18.0, 28.0, 44.0, 65.0, 98.0, 181.0, 374.0, 874.0, 2171.0, 6945.0, 38067.0, 560182.0, 401083.0, 29071.0, 5882.0, 1890.0, 753.0, 331.0, 172.0, 99.0, 62.0, 35.0, 23.0, 15.0, 16.0, 9.0, 5.0, 4.0, 4.0, 3.0, 7.0, 1.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.014801025390625, -0.014377355575561523, -0.013953685760498047, -0.01353001594543457, -0.013106346130371094, -0.012682676315307617, -0.01225900650024414, -0.011835336685180664, -0.011411666870117188, -0.010987997055053711, -0.010564327239990234, -0.010140657424926758, -0.009716987609863281, -0.009293317794799805, -0.008869647979736328, -0.008445978164672852, -0.008022308349609375, -0.0075986385345458984, -0.007174968719482422, -0.006751298904418945, -0.006327629089355469, -0.005903959274291992, -0.005480289459228516, -0.005056619644165039, -0.0046329498291015625, -0.004209280014038086, -0.0037856101989746094, -0.003361940383911133, -0.0029382705688476562, -0.0025146007537841797, -0.002090930938720703, -0.0016672611236572266, -0.00124359130859375, -0.0008199214935302734, -0.0003962516784667969, 2.7418136596679688e-05, 0.00045108795166015625, 0.0008747577667236328, 0.0012984275817871094, 0.001722097396850586, 0.0021457672119140625, 0.002569437026977539, 0.0029931068420410156, 0.003416776657104492, 0.0038404464721679688, 0.004264116287231445, 0.004687786102294922, 0.0051114559173583984, 0.005535125732421875, 0.0059587955474853516, 0.006382465362548828, 0.006806135177612305, 0.007229804992675781, 0.007653474807739258, 0.008077144622802734, 0.008500814437866211, 0.008924484252929688, 0.009348154067993164, 0.00977182388305664, 0.010195493698120117, 0.010619163513183594, 0.01104283332824707, 0.011466503143310547, 0.011890172958374023, 0.0123138427734375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 6.0, 12.0, 15.0, 13.0, 24.0, 33.0, 26.0, 44.0, 44.0, 64.0, 83.0, 83.0, 81.0, 95.0, 71.0, 70.0, 41.0, 41.0, 41.0, 19.0, 17.0, 21.0, 14.0, 5.0, 12.0, 9.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.967782974243164e-05, -6.712786853313446e-05, -6.457790732383728e-05, -6.20279461145401e-05, -5.947798490524292e-05, -5.692802369594574e-05, -5.437806248664856e-05, -5.182810127735138e-05, -4.92781400680542e-05, -4.672817885875702e-05, -4.417821764945984e-05, -4.162825644016266e-05, -3.907829523086548e-05, -3.65283340215683e-05, -3.397837281227112e-05, -3.142841160297394e-05, -2.8878450393676758e-05, -2.6328489184379578e-05, -2.3778527975082397e-05, -2.1228566765785217e-05, -1.8678605556488037e-05, -1.6128644347190857e-05, -1.3578683137893677e-05, -1.1028721928596497e-05, -8.478760719299316e-06, -5.928799510002136e-06, -3.378838300704956e-06, -8.288770914077759e-07, 1.7210841178894043e-06, 4.2710453271865845e-06, 6.821006536483765e-06, 9.370967745780945e-06, 1.1920928955078125e-05, 1.4470890164375305e-05, 1.7020851373672485e-05, 1.9570812582969666e-05, 2.2120773792266846e-05, 2.4670735001564026e-05, 2.7220696210861206e-05, 2.9770657420158386e-05, 3.2320618629455566e-05, 3.4870579838752747e-05, 3.742054104804993e-05, 3.997050225734711e-05, 4.252046346664429e-05, 4.507042467594147e-05, 4.762038588523865e-05, 5.017034709453583e-05, 5.272030830383301e-05, 5.527026951313019e-05, 5.782023072242737e-05, 6.037019193172455e-05, 6.292015314102173e-05, 6.547011435031891e-05, 6.802007555961609e-05, 7.057003676891327e-05, 7.311999797821045e-05, 7.566995918750763e-05, 7.821992039680481e-05, 8.076988160610199e-05, 8.331984281539917e-05, 8.586980402469635e-05, 8.841976523399353e-05, 9.096972644329071e-05, 9.351968765258789e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 5.0, 2.0, 4.0, 9.0, 20.0, 25.0, 35.0, 45.0, 87.0, 134.0, 297.0, 645.0, 2300.0, 22689.0, 926168.0, 90032.0, 4270.0, 944.0, 362.0, 181.0, 111.0, 53.0, 46.0, 31.0, 24.0, 6.0, 10.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.031402587890625, -0.03063058853149414, -0.02985858917236328, -0.029086589813232422, -0.028314590454101562, -0.027542591094970703, -0.026770591735839844, -0.025998592376708984, -0.025226593017578125, -0.024454593658447266, -0.023682594299316406, -0.022910594940185547, -0.022138595581054688, -0.021366596221923828, -0.02059459686279297, -0.01982259750366211, -0.01905059814453125, -0.01827859878540039, -0.01750659942626953, -0.016734600067138672, -0.015962600708007812, -0.015190601348876953, -0.014418601989746094, -0.013646602630615234, -0.012874603271484375, -0.012102603912353516, -0.011330604553222656, -0.010558605194091797, -0.009786605834960938, -0.009014606475830078, -0.008242607116699219, -0.007470607757568359, -0.0066986083984375, -0.005926609039306641, -0.005154609680175781, -0.004382610321044922, -0.0036106109619140625, -0.002838611602783203, -0.0020666122436523438, -0.0012946128845214844, -0.000522613525390625, 0.0002493858337402344, 0.0010213851928710938, 0.0017933845520019531, 0.0025653839111328125, 0.003337383270263672, 0.004109382629394531, 0.004881381988525391, 0.00565338134765625, 0.006425380706787109, 0.007197380065917969, 0.007969379425048828, 0.008741378784179688, 0.009513378143310547, 0.010285377502441406, 0.011057376861572266, 0.011829376220703125, 0.012601375579833984, 0.013373374938964844, 0.014145374298095703, 0.014917373657226562, 0.015689373016357422, 0.01646137237548828, 0.01723337173461914, 0.01800537109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 5.0, 6.0, 19.0, 13.0, 23.0, 27.0, 28.0, 56.0, 72.0, 87.0, 125.0, 110.0, 108.0, 100.0, 58.0, 36.0, 25.0, 26.0, 16.0, 16.0, 12.0, 9.0, 2.0, 4.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005786895751953125, -0.005539357662200928, -0.0052918195724487305, -0.005044281482696533, -0.004796743392944336, -0.004549205303192139, -0.004301667213439941, -0.004054129123687744, -0.003806591033935547, -0.0035590529441833496, -0.0033115148544311523, -0.003063976764678955, -0.002816438674926758, -0.0025689005851745605, -0.0023213624954223633, -0.002073824405670166, -0.0018262863159179688, -0.0015787482261657715, -0.0013312101364135742, -0.001083672046661377, -0.0008361339569091797, -0.0005885958671569824, -0.00034105777740478516, -9.351968765258789e-05, 0.00015401840209960938, 0.00040155649185180664, 0.0006490945816040039, 0.0008966326713562012, 0.0011441707611083984, 0.0013917088508605957, 0.001639246940612793, 0.0018867850303649902, 0.0021343231201171875, 0.0023818612098693848, 0.002629399299621582, 0.0028769373893737793, 0.0031244754791259766, 0.003372013568878174, 0.003619551658630371, 0.0038670897483825684, 0.004114627838134766, 0.004362165927886963, 0.00460970401763916, 0.004857242107391357, 0.005104780197143555, 0.005352318286895752, 0.005599856376647949, 0.0058473944664001465, 0.006094932556152344, 0.006342470645904541, 0.006590008735656738, 0.0068375468254089355, 0.007085084915161133, 0.00733262300491333, 0.007580161094665527, 0.007827699184417725, 0.008075237274169922, 0.00832277536392212, 0.008570313453674316, 0.008817851543426514, 0.009065389633178711, 0.009312927722930908, 0.009560465812683105, 0.009808003902435303, 0.0100555419921875]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 28.0, 299.0, 516.0, 125.0, 30.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2858009338378906, -0.2782890796661377, -0.2707771956920624, -0.26326534152030945, -0.25575345754623413, -0.2482416033744812, -0.24072974920272827, -0.23321788012981415, -0.22570601105690002, -0.2181941419839859, -0.21068227291107178, -0.20317041873931885, -0.19565854966640472, -0.1881466805934906, -0.18063482642173767, -0.17312295734882355, -0.16561108827590942, -0.1580992192029953, -0.15058735013008118, -0.14307549595832825, -0.13556362688541412, -0.1280517578125, -0.12053989619016647, -0.11302803456783295, -0.10551616549491882, -0.0980042964220047, -0.09049243479967117, -0.08298057317733765, -0.07546870410442352, -0.0679568350315094, -0.06044497340917587, -0.05293310806155205, -0.04542122781276703, -0.037909362465143204, -0.03039749711751938, -0.022885631769895554, -0.015373766422271729, -0.007861901074647903, -0.00035003572702407837, 0.007161829620599747, 0.014673694968223572, 0.022185560315847397, 0.029697425663471222, 0.03720929101109505, 0.04472115635871887, 0.0522330217063427, 0.05974488705396652, 0.06725674867630005, 0.07476861774921417, 0.0822804868221283, 0.08979234844446182, 0.09730421006679535, 0.10481607913970947, 0.1123279482126236, 0.11983980983495712, 0.12735167145729065, 0.13486354053020477, 0.1423754096031189, 0.14988726377487183, 0.15739913284778595, 0.16491100192070007, 0.1724228709936142, 0.17993474006652832, 0.18744659423828125, 0.19495846331119537]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 8.0, 5.0, 9.0, 13.0, 13.0, 13.0, 15.0, 22.0, 20.0, 26.0, 34.0, 27.0, 55.0, 36.0, 46.0, 52.0, 63.0, 48.0, 39.0, 58.0, 50.0, 48.0, 46.0, 38.0, 43.0, 39.0, 22.0, 19.0, 13.0, 20.0, 8.0, 16.0, 7.0, 10.0, 4.0, 6.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04639232158660889, -0.044932566583156586, -0.043472807854413986, -0.04201304912567139, -0.040553294122219086, -0.039093539118766785, -0.037633780390024185, -0.036174021661281586, -0.034714266657829285, -0.033254511654376984, -0.031794752925634384, -0.030334996059536934, -0.028875239193439484, -0.027415482327342033, -0.025955725461244583, -0.024495968595147133, -0.023036211729049683, -0.021576454862952232, -0.020116697996854782, -0.018656941130757332, -0.01719718426465988, -0.01573742739856243, -0.014277670532464981, -0.01281791366636753, -0.01135815680027008, -0.00989839993417263, -0.00843864306807518, -0.00697888620197773, -0.0055191293358802795, -0.004059372469782829, -0.002599615603685379, -0.0011398587375879288, 0.0003198981285095215, 0.0017796549946069717, 0.003239411860704422, 0.004699168726801872, 0.0061589255928993225, 0.007618682458996773, 0.009078439325094223, 0.010538196191191673, 0.011997953057289124, 0.013457709923386574, 0.014917466789484024, 0.016377223655581474, 0.017836980521678925, 0.019296737387776375, 0.020756494253873825, 0.022216251119971275, 0.023676007986068726, 0.025135764852166176, 0.026595521718263626, 0.028055278584361076, 0.029515035450458527, 0.030974792316555977, 0.03243454918265343, 0.03389430791139603, 0.03535406291484833, 0.03681381791830063, 0.03827357664704323, 0.03973333537578583, 0.04119309037923813, 0.04265284538269043, 0.04411260411143303, 0.04557236284017563, 0.04703211784362793]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 11.0, 6.0, 16.0, 34.0, 28.0, 57.0, 72.0, 128.0, 172.0, 321.0, 574.0, 1042.0, 2769.0, 6630.0, 42508.0, 3946726.0, 179045.0, 9150.0, 2402.0, 871.0, 570.0, 364.0, 239.0, 161.0, 93.0, 84.0, 70.0, 38.0, 26.0, 26.0, 14.0, 13.0, 11.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03173828125, -0.030703067779541016, -0.02966785430908203, -0.028632640838623047, -0.027597427368164062, -0.026562213897705078, -0.025527000427246094, -0.02449178695678711, -0.023456573486328125, -0.02242136001586914, -0.021386146545410156, -0.020350933074951172, -0.019315719604492188, -0.018280506134033203, -0.01724529266357422, -0.016210079193115234, -0.01517486572265625, -0.014139652252197266, -0.013104438781738281, -0.012069225311279297, -0.011034011840820312, -0.009998798370361328, -0.008963584899902344, -0.00792837142944336, -0.006893157958984375, -0.005857944488525391, -0.004822731018066406, -0.003787517547607422, -0.0027523040771484375, -0.0017170906066894531, -0.0006818771362304688, 0.0003533363342285156, 0.0013885498046875, 0.0024237632751464844, 0.0034589767456054688, 0.004494190216064453, 0.0055294036865234375, 0.006564617156982422, 0.007599830627441406, 0.00863504409790039, 0.009670257568359375, 0.01070547103881836, 0.011740684509277344, 0.012775897979736328, 0.013811111450195312, 0.014846324920654297, 0.01588153839111328, 0.016916751861572266, 0.01795196533203125, 0.018987178802490234, 0.02002239227294922, 0.021057605743408203, 0.022092819213867188, 0.023128032684326172, 0.024163246154785156, 0.02519845962524414, 0.026233673095703125, 0.02726888656616211, 0.028304100036621094, 0.029339313507080078, 0.030374526977539062, 0.03140974044799805, 0.03244495391845703, 0.033480167388916016, 0.034515380859375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 10.0, 40.0, 85.0, 190.0, 259.0, 200.0, 142.0, 52.0, 20.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01702880859375, -0.016456127166748047, -0.015883445739746094, -0.01531076431274414, -0.014738082885742188, -0.014165401458740234, -0.013592720031738281, -0.013020038604736328, -0.012447357177734375, -0.011874675750732422, -0.011301994323730469, -0.010729312896728516, -0.010156631469726562, -0.00958395004272461, -0.009011268615722656, -0.008438587188720703, -0.00786590576171875, -0.007293224334716797, -0.006720542907714844, -0.006147861480712891, -0.0055751800537109375, -0.005002498626708984, -0.004429817199707031, -0.003857135772705078, -0.003284454345703125, -0.002711772918701172, -0.0021390914916992188, -0.0015664100646972656, -0.0009937286376953125, -0.0004210472106933594, 0.00015163421630859375, 0.0007243156433105469, 0.0012969970703125, 0.0018696784973144531, 0.0024423599243164062, 0.0030150413513183594, 0.0035877227783203125, 0.004160404205322266, 0.004733085632324219, 0.005305767059326172, 0.005878448486328125, 0.006451129913330078, 0.007023811340332031, 0.007596492767333984, 0.008169174194335938, 0.00874185562133789, 0.009314537048339844, 0.009887218475341797, 0.01045989990234375, 0.011032581329345703, 0.011605262756347656, 0.01217794418334961, 0.012750625610351562, 0.013323307037353516, 0.013895988464355469, 0.014468669891357422, 0.015041351318359375, 0.015614032745361328, 0.01618671417236328, 0.016759395599365234, 0.017332077026367188, 0.01790475845336914, 0.018477439880371094, 0.019050121307373047, 0.019622802734375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 6.0, 2.0, 9.0, 9.0, 16.0, 23.0, 24.0, 37.0, 57.0, 73.0, 135.0, 237.0, 461.0, 946.0, 3401.0, 27760.0, 3553829.0, 592231.0, 11211.0, 2177.0, 780.0, 362.0, 181.0, 104.0, 76.0, 39.0, 29.0, 24.0, 17.0, 7.0, 9.0, 3.0, 6.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02984619140625, -0.02873373031616211, -0.02762126922607422, -0.026508808135986328, -0.025396347045898438, -0.024283885955810547, -0.023171424865722656, -0.022058963775634766, -0.020946502685546875, -0.019834041595458984, -0.018721580505371094, -0.017609119415283203, -0.016496658325195312, -0.015384197235107422, -0.014271736145019531, -0.01315927505493164, -0.01204681396484375, -0.01093435287475586, -0.009821891784667969, -0.008709430694580078, -0.0075969696044921875, -0.006484508514404297, -0.005372047424316406, -0.004259586334228516, -0.003147125244140625, -0.0020346641540527344, -0.0009222030639648438, 0.00019025802612304688, 0.0013027191162109375, 0.002415180206298828, 0.0035276412963867188, 0.004640102386474609, 0.0057525634765625, 0.006865024566650391, 0.007977485656738281, 0.009089946746826172, 0.010202407836914062, 0.011314868927001953, 0.012427330017089844, 0.013539791107177734, 0.014652252197265625, 0.015764713287353516, 0.016877174377441406, 0.017989635467529297, 0.019102096557617188, 0.020214557647705078, 0.02132701873779297, 0.02243947982788086, 0.02355194091796875, 0.02466440200805664, 0.02577686309814453, 0.026889324188232422, 0.028001785278320312, 0.029114246368408203, 0.030226707458496094, 0.031339168548583984, 0.032451629638671875, 0.033564090728759766, 0.034676551818847656, 0.03578901290893555, 0.03690147399902344, 0.03801393508911133, 0.03912639617919922, 0.04023885726928711, 0.041351318359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 6.0, 10.0, 20.0, 18.0, 29.0, 31.0, 60.0, 84.0, 104.0, 135.0, 227.0, 313.0, 495.0, 642.0, 531.0, 391.0, 302.0, 187.0, 139.0, 101.0, 63.0, 54.0, 27.0, 31.0, 21.0, 19.0, 7.0, 10.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01004791259765625, -0.009709000587463379, -0.009370088577270508, -0.009031176567077637, -0.008692264556884766, -0.008353352546691895, -0.008014440536499023, -0.007675528526306152, -0.007336616516113281, -0.00699770450592041, -0.006658792495727539, -0.006319880485534668, -0.005980968475341797, -0.005642056465148926, -0.005303144454956055, -0.004964232444763184, -0.0046253204345703125, -0.004286408424377441, -0.00394749641418457, -0.0036085844039916992, -0.003269672393798828, -0.002930760383605957, -0.002591848373413086, -0.002252936363220215, -0.0019140243530273438, -0.0015751123428344727, -0.0012362003326416016, -0.0008972883224487305, -0.0005583763122558594, -0.00021946430206298828, 0.00011944770812988281, 0.0004583597183227539, 0.000797271728515625, 0.001136183738708496, 0.0014750957489013672, 0.0018140077590942383, 0.0021529197692871094, 0.0024918317794799805, 0.0028307437896728516, 0.0031696557998657227, 0.0035085678100585938, 0.003847479820251465, 0.004186391830444336, 0.004525303840637207, 0.004864215850830078, 0.005203127861022949, 0.00554203987121582, 0.005880951881408691, 0.0062198638916015625, 0.006558775901794434, 0.006897687911987305, 0.007236599922180176, 0.007575511932373047, 0.007914423942565918, 0.008253335952758789, 0.00859224796295166, 0.008931159973144531, 0.009270071983337402, 0.009608983993530273, 0.009947896003723145, 0.010286808013916016, 0.010625720024108887, 0.010964632034301758, 0.011303544044494629, 0.0116424560546875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 20.0, 198.0, 542.0, 200.0, 26.0, 12.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25941604375839233, -0.2524815797805786, -0.2455471158027649, -0.23861265182495117, -0.23167817294597626, -0.22474370896816254, -0.21780924499034882, -0.2108747810125351, -0.20394031703472137, -0.19700585305690765, -0.19007138907909393, -0.18313691020011902, -0.1762024462223053, -0.16926798224449158, -0.16233351826667786, -0.15539905428886414, -0.14846459031105042, -0.1415301263332367, -0.13459566235542297, -0.12766119837760925, -0.12072672694921494, -0.11379225552082062, -0.1068577915430069, -0.09992332756519318, -0.09298884868621826, -0.08605438470840454, -0.07911991328001022, -0.0721854493021965, -0.06525098532438278, -0.05831651762127876, -0.051382049918174744, -0.04444758594036102, -0.0375131219625473, -0.030578656122088432, -0.023644190281629562, -0.016709722578525543, -0.009775256738066673, -0.0028407908976078033, 0.004093676805496216, 0.011028140783309937, 0.017962608486413956, 0.024897074326872826, 0.031831540167331696, 0.038766007870435715, 0.045700475573539734, 0.052634939551353455, 0.059569407254457474, 0.0665038675069809, 0.07343833893537521, 0.08037280291318893, 0.08730727434158325, 0.09424173831939697, 0.1011762022972107, 0.10811066627502441, 0.11504513770341873, 0.12197960168123245, 0.12891407310962677, 0.1358485370874405, 0.1427830010652542, 0.14971747994422913, 0.15665194392204285, 0.16358640789985657, 0.1705208718776703, 0.177455335855484, 0.18438979983329773]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 5.0, 9.0, 6.0, 11.0, 15.0, 19.0, 26.0, 33.0, 41.0, 37.0, 48.0, 51.0, 63.0, 50.0, 50.0, 61.0, 49.0, 49.0, 59.0, 45.0, 49.0, 45.0, 44.0, 29.0, 19.0, 23.0, 20.0, 14.0, 9.0, 11.0, 5.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.05988001823425293, -0.05845063924789429, -0.05702126398682594, -0.0555918887257576, -0.054162509739398956, -0.052733130753040314, -0.05130375549197197, -0.049874380230903625, -0.04844500124454498, -0.04701562225818634, -0.045586246997117996, -0.04415687173604965, -0.04272749274969101, -0.04129811376333237, -0.03986873850226402, -0.03843936324119568, -0.037009984254837036, -0.035580605268478394, -0.03415123000741005, -0.032721854746341705, -0.03129247575998306, -0.02986309863626957, -0.028433721512556076, -0.027004344388842583, -0.02557496726512909, -0.024145590141415596, -0.022716213017702103, -0.02128683589398861, -0.019857458770275116, -0.018428081646561623, -0.01699870452284813, -0.015569327399134636, -0.014139950275421143, -0.01271057315170765, -0.011281196027994156, -0.009851818904280663, -0.00842244178056717, -0.006993064656853676, -0.0055636875331401825, -0.004134310409426689, -0.002704933285713196, -0.0012755561619997025, 0.0001538209617137909, 0.0015831980854272842, 0.0030125752091407776, 0.004441952332854271, 0.005871329456567764, 0.007300706580281258, 0.008730083703994751, 0.010159460827708244, 0.011588837951421738, 0.013018215075135231, 0.014447592198848724, 0.015876969322562218, 0.01730634644627571, 0.018735723569989204, 0.020165100693702698, 0.02159447781741619, 0.023023854941129684, 0.024453232064843178, 0.02588260918855667, 0.027311986312270164, 0.028741363435983658, 0.03017074055969715, 0.031600117683410645]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 3.0, 4.0, 4.0, 1.0, 6.0, 5.0, 9.0, 15.0, 25.0, 29.0, 44.0, 75.0, 109.0, 123.0, 241.0, 427.0, 654.0, 1389.0, 6929.0, 555890.0, 473217.0, 6183.0, 1381.0, 666.0, 411.0, 236.0, 173.0, 99.0, 69.0, 55.0, 24.0, 19.0, 18.0, 7.0, 10.0, 7.0, 1.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05535888671875, -0.053680419921875, -0.052001953125, -0.050323486328125, -0.04864501953125, -0.046966552734375, -0.0452880859375, -0.043609619140625, -0.04193115234375, -0.040252685546875, -0.03857421875, -0.036895751953125, -0.03521728515625, -0.033538818359375, -0.0318603515625, -0.030181884765625, -0.02850341796875, -0.026824951171875, -0.025146484375, -0.023468017578125, -0.02178955078125, -0.020111083984375, -0.0184326171875, -0.016754150390625, -0.01507568359375, -0.013397216796875, -0.01171875, -0.010040283203125, -0.00836181640625, -0.006683349609375, -0.0050048828125, -0.003326416015625, -0.00164794921875, 3.0517578125e-05, 0.001708984375, 0.003387451171875, 0.00506591796875, 0.006744384765625, 0.0084228515625, 0.010101318359375, 0.01177978515625, 0.013458251953125, 0.01513671875, 0.016815185546875, 0.01849365234375, 0.020172119140625, 0.0218505859375, 0.023529052734375, 0.02520751953125, 0.026885986328125, 0.028564453125, 0.030242919921875, 0.03192138671875, 0.033599853515625, 0.0352783203125, 0.036956787109375, 0.03863525390625, 0.040313720703125, 0.0419921875, 0.043670654296875, 0.04534912109375, 0.047027587890625, 0.0487060546875, 0.050384521484375, 0.05206298828125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 41.0, 106.0, 220.0, 254.0, 204.0, 123.0, 30.0, 9.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0169677734375, -0.01639246940612793, -0.01581716537475586, -0.015241861343383789, -0.014666557312011719, -0.014091253280639648, -0.013515949249267578, -0.012940645217895508, -0.012365341186523438, -0.011790037155151367, -0.011214733123779297, -0.010639429092407227, -0.010064125061035156, -0.009488821029663086, -0.008913516998291016, -0.008338212966918945, -0.007762908935546875, -0.007187604904174805, -0.006612300872802734, -0.006036996841430664, -0.005461692810058594, -0.0048863887786865234, -0.004311084747314453, -0.003735780715942383, -0.0031604766845703125, -0.002585172653198242, -0.002009868621826172, -0.0014345645904541016, -0.0008592605590820312, -0.00028395652770996094, 0.0002913475036621094, 0.0008666515350341797, 0.00144195556640625, 0.0020172595977783203, 0.0025925636291503906, 0.003167867660522461, 0.0037431716918945312, 0.0043184757232666016, 0.004893779754638672, 0.005469083786010742, 0.0060443878173828125, 0.006619691848754883, 0.007194995880126953, 0.0077702999114990234, 0.008345603942871094, 0.008920907974243164, 0.009496212005615234, 0.010071516036987305, 0.010646820068359375, 0.011222124099731445, 0.011797428131103516, 0.012372732162475586, 0.012948036193847656, 0.013523340225219727, 0.014098644256591797, 0.014673948287963867, 0.015249252319335938, 0.015824556350708008, 0.016399860382080078, 0.01697516441345215, 0.01755046844482422, 0.01812577247619629, 0.01870107650756836, 0.01927638053894043, 0.0198516845703125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 8.0, 12.0, 9.0, 19.0, 17.0, 35.0, 51.0, 61.0, 82.0, 101.0, 150.0, 214.0, 329.0, 670.0, 1300.0, 3374.0, 11140.0, 60423.0, 410241.0, 467967.0, 72445.0, 12942.0, 3738.0, 1416.0, 717.0, 373.0, 200.0, 136.0, 111.0, 70.0, 47.0, 44.0, 38.0, 19.0, 18.0, 15.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0205841064453125, -0.020013093948364258, -0.019442081451416016, -0.018871068954467773, -0.01830005645751953, -0.01772904396057129, -0.017158031463623047, -0.016587018966674805, -0.016016006469726562, -0.01544499397277832, -0.014873981475830078, -0.014302968978881836, -0.013731956481933594, -0.013160943984985352, -0.01258993148803711, -0.012018918991088867, -0.011447906494140625, -0.010876893997192383, -0.01030588150024414, -0.009734869003295898, -0.009163856506347656, -0.008592844009399414, -0.008021831512451172, -0.00745081901550293, -0.0068798065185546875, -0.006308794021606445, -0.005737781524658203, -0.005166769027709961, -0.004595756530761719, -0.0040247440338134766, -0.0034537315368652344, -0.002882719039916992, -0.00231170654296875, -0.0017406940460205078, -0.0011696815490722656, -0.0005986690521240234, -2.765655517578125e-05, 0.0005433559417724609, 0.0011143684387207031, 0.0016853809356689453, 0.0022563934326171875, 0.0028274059295654297, 0.003398418426513672, 0.003969430923461914, 0.004540443420410156, 0.0051114559173583984, 0.005682468414306641, 0.006253480911254883, 0.006824493408203125, 0.007395505905151367, 0.00796651840209961, 0.008537530899047852, 0.009108543395996094, 0.009679555892944336, 0.010250568389892578, 0.01082158088684082, 0.011392593383789062, 0.011963605880737305, 0.012534618377685547, 0.013105630874633789, 0.013676643371582031, 0.014247655868530273, 0.014818668365478516, 0.015389680862426758, 0.015960693359375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 8.0, 9.0, 5.0, 11.0, 14.0, 21.0, 19.0, 19.0, 22.0, 23.0, 19.0, 34.0, 31.0, 28.0, 54.0, 50.0, 54.0, 45.0, 46.0, 41.0, 48.0, 57.0, 41.0, 35.0, 40.0, 35.0, 29.0, 22.0, 23.0, 27.0, 20.0, 20.0, 10.0, 14.0, 9.0, 8.0, 5.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01031494140625, -0.009937524795532227, -0.009560108184814453, -0.00918269157409668, -0.008805274963378906, -0.008427858352661133, -0.00805044174194336, -0.007673025131225586, -0.0072956085205078125, -0.006918191909790039, -0.006540775299072266, -0.006163358688354492, -0.005785942077636719, -0.005408525466918945, -0.005031108856201172, -0.0046536922454833984, -0.004276275634765625, -0.0038988590240478516, -0.003521442413330078, -0.0031440258026123047, -0.0027666091918945312, -0.002389192581176758, -0.0020117759704589844, -0.001634359359741211, -0.0012569427490234375, -0.0008795261383056641, -0.0005021095275878906, -0.0001246929168701172, 0.00025272369384765625, 0.0006301403045654297, 0.0010075569152832031, 0.0013849735260009766, 0.00176239013671875, 0.0021398067474365234, 0.002517223358154297, 0.0028946399688720703, 0.0032720565795898438, 0.003649473190307617, 0.004026889801025391, 0.004404306411743164, 0.0047817230224609375, 0.005159139633178711, 0.005536556243896484, 0.005913972854614258, 0.006291389465332031, 0.006668806076049805, 0.007046222686767578, 0.0074236392974853516, 0.007801055908203125, 0.008178472518920898, 0.008555889129638672, 0.008933305740356445, 0.009310722351074219, 0.009688138961791992, 0.010065555572509766, 0.010442972183227539, 0.010820388793945312, 0.011197805404663086, 0.01157522201538086, 0.011952638626098633, 0.012330055236816406, 0.01270747184753418, 0.013084888458251953, 0.013462305068969727, 0.0138397216796875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 10.0, 7.0, 10.0, 15.0, 27.0, 32.0, 46.0, 75.0, 147.0, 259.0, 427.0, 846.0, 1690.0, 3580.0, 9713.0, 50437.0, 633139.0, 308926.0, 26531.0, 6911.0, 2795.0, 1352.0, 655.0, 350.0, 226.0, 126.0, 68.0, 50.0, 29.0, 20.0, 16.0, 9.0, 4.0, 4.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.009124755859375, -0.008828878402709961, -0.008533000946044922, -0.008237123489379883, -0.007941246032714844, -0.007645368576049805, -0.007349491119384766, -0.0070536136627197266, -0.0067577362060546875, -0.0064618587493896484, -0.006165981292724609, -0.00587010383605957, -0.005574226379394531, -0.005278348922729492, -0.004982471466064453, -0.004686594009399414, -0.004390716552734375, -0.004094839096069336, -0.003798961639404297, -0.003503084182739258, -0.0032072067260742188, -0.0029113292694091797, -0.0026154518127441406, -0.0023195743560791016, -0.0020236968994140625, -0.0017278194427490234, -0.0014319419860839844, -0.0011360645294189453, -0.0008401870727539062, -0.0005443096160888672, -0.0002484321594238281, 4.744529724121094e-05, 0.00034332275390625, 0.0006392002105712891, 0.0009350776672363281, 0.0012309551239013672, 0.0015268325805664062, 0.0018227100372314453, 0.0021185874938964844, 0.0024144649505615234, 0.0027103424072265625, 0.0030062198638916016, 0.0033020973205566406, 0.0035979747772216797, 0.0038938522338867188, 0.004189729690551758, 0.004485607147216797, 0.004781484603881836, 0.005077362060546875, 0.005373239517211914, 0.005669116973876953, 0.005964994430541992, 0.006260871887207031, 0.00655674934387207, 0.006852626800537109, 0.0071485042572021484, 0.0074443817138671875, 0.0077402591705322266, 0.008036136627197266, 0.008332014083862305, 0.008627891540527344, 0.008923768997192383, 0.009219646453857422, 0.009515523910522461, 0.0098114013671875]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 5.0, 1.0, 3.0, 2.0, 3.0, 4.0, 9.0, 9.0, 8.0, 10.0, 16.0, 17.0, 17.0, 24.0, 34.0, 39.0, 36.0, 39.0, 55.0, 61.0, 101.0, 91.0, 61.0, 48.0, 62.0, 33.0, 33.0, 34.0, 33.0, 26.0, 17.0, 10.0, 21.0, 3.0, 11.0, 10.0, 7.0, 3.0, 5.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.164478302001953e-05, -6.9422647356987e-05, -6.720051169395447e-05, -6.497837603092194e-05, -6.27562403678894e-05, -6.053410470485687e-05, -5.831196904182434e-05, -5.608983337879181e-05, -5.386769771575928e-05, -5.1645562052726746e-05, -4.9423426389694214e-05, -4.720129072666168e-05, -4.497915506362915e-05, -4.275701940059662e-05, -4.053488373756409e-05, -3.8312748074531555e-05, -3.6090612411499023e-05, -3.386847674846649e-05, -3.164634108543396e-05, -2.9424205422401428e-05, -2.7202069759368896e-05, -2.4979934096336365e-05, -2.2757798433303833e-05, -2.05356627702713e-05, -1.831352710723877e-05, -1.6091391444206238e-05, -1.3869255781173706e-05, -1.1647120118141174e-05, -9.424984455108643e-06, -7.202848792076111e-06, -4.980713129043579e-06, -2.7585774660110474e-06, -5.364418029785156e-07, 1.6856938600540161e-06, 3.907829523086548e-06, 6.12996518611908e-06, 8.352100849151611e-06, 1.0574236512184143e-05, 1.2796372175216675e-05, 1.5018507838249207e-05, 1.7240643501281738e-05, 1.946277916431427e-05, 2.1684914827346802e-05, 2.3907050490379333e-05, 2.6129186153411865e-05, 2.8351321816444397e-05, 3.057345747947693e-05, 3.279559314250946e-05, 3.501772880554199e-05, 3.7239864468574524e-05, 3.9462000131607056e-05, 4.168413579463959e-05, 4.390627145767212e-05, 4.612840712070465e-05, 4.835054278373718e-05, 5.0572678446769714e-05, 5.2794814109802246e-05, 5.501694977283478e-05, 5.723908543586731e-05, 5.946122109889984e-05, 6.168335676193237e-05, 6.39054924249649e-05, 6.612762808799744e-05, 6.834976375102997e-05, 7.05718994140625e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 12.0, 11.0, 26.0, 17.0, 42.0, 65.0, 94.0, 220.0, 315.0, 593.0, 1198.0, 2434.0, 5313.0, 15129.0, 100262.0, 745527.0, 146805.0, 18738.0, 6104.0, 2751.0, 1361.0, 640.0, 389.0, 216.0, 105.0, 54.0, 38.0, 16.0, 14.0, 11.0, 10.0, 13.0, 6.0, 2.0, 1.0, 7.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00913238525390625, -0.008852005004882812, -0.008571624755859375, -0.008291244506835938, -0.0080108642578125, -0.0077304840087890625, -0.007450103759765625, -0.0071697235107421875, -0.00688934326171875, -0.0066089630126953125, -0.006328582763671875, -0.0060482025146484375, -0.005767822265625, -0.0054874420166015625, -0.005207061767578125, -0.0049266815185546875, -0.00464630126953125, -0.0043659210205078125, -0.004085540771484375, -0.0038051605224609375, -0.0035247802734375, -0.0032444000244140625, -0.002964019775390625, -0.0026836395263671875, -0.00240325927734375, -0.0021228790283203125, -0.001842498779296875, -0.0015621185302734375, -0.00128173828125, -0.0010013580322265625, -0.000720977783203125, -0.0004405975341796875, -0.00016021728515625, 0.0001201629638671875, 0.000400543212890625, 0.0006809234619140625, 0.0009613037109375, 0.0012416839599609375, 0.001522064208984375, 0.0018024444580078125, 0.00208282470703125, 0.0023632049560546875, 0.002643585205078125, 0.0029239654541015625, 0.003204345703125, 0.0034847259521484375, 0.003765106201171875, 0.0040454864501953125, 0.00432586669921875, 0.0046062469482421875, 0.004886627197265625, 0.0051670074462890625, 0.0054473876953125, 0.0057277679443359375, 0.006008148193359375, 0.0062885284423828125, 0.00656890869140625, 0.0068492889404296875, 0.007129669189453125, 0.0074100494384765625, 0.0076904296875, 0.007970809936523438, 0.008251190185546875, 0.008531570434570312, 0.00881195068359375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 7.0, 8.0, 20.0, 27.0, 25.0, 50.0, 64.0, 82.0, 123.0, 120.0, 119.0, 119.0, 73.0, 50.0, 27.0, 25.0, 13.0, 11.0, 4.0, 1.0, 9.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006717681884765625, -0.006518185138702393, -0.00631868839263916, -0.006119191646575928, -0.005919694900512695, -0.005720198154449463, -0.0055207014083862305, -0.005321204662322998, -0.005121707916259766, -0.004922211170196533, -0.004722714424133301, -0.004523217678070068, -0.004323720932006836, -0.0041242241859436035, -0.003924727439880371, -0.0037252306938171387, -0.0035257339477539062, -0.003326237201690674, -0.0031267404556274414, -0.002927243709564209, -0.0027277469635009766, -0.002528250217437744, -0.0023287534713745117, -0.0021292567253112793, -0.0019297599792480469, -0.0017302632331848145, -0.001530766487121582, -0.0013312697410583496, -0.0011317729949951172, -0.0009322762489318848, -0.0007327795028686523, -0.0005332827568054199, -0.0003337860107421875, -0.00013428926467895508, 6.520748138427734e-05, 0.00026470422744750977, 0.0004642009735107422, 0.0006636977195739746, 0.000863194465637207, 0.0010626912117004395, 0.0012621879577636719, 0.0014616847038269043, 0.0016611814498901367, 0.0018606781959533691, 0.0020601749420166016, 0.002259671688079834, 0.0024591684341430664, 0.002658665180206299, 0.0028581619262695312, 0.0030576586723327637, 0.003257155418395996, 0.0034566521644592285, 0.003656148910522461, 0.0038556456565856934, 0.004055142402648926, 0.004254639148712158, 0.004454135894775391, 0.004653632640838623, 0.0048531293869018555, 0.005052626132965088, 0.00525212287902832, 0.005451619625091553, 0.005651116371154785, 0.005850613117218018, 0.00605010986328125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 14.0, 321.0, 596.0, 58.0, 17.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08801757544279099, -0.07925599068403244, -0.0704943984746933, -0.06173281371593475, -0.05297122523188591, -0.04420963674783707, -0.03544805198907852, -0.02668646350502968, -0.017924875020980835, -0.009163287468254566, -0.0004016999155282974, 0.008359886705875397, 0.01712147518992424, 0.025883063673973083, 0.03464464843273163, 0.04340623691678047, 0.052167825400829315, 0.06092941388487816, 0.069691002368927, 0.07845258712768555, 0.08721417188644409, 0.09597576409578323, 0.10473734885454178, 0.11349894106388092, 0.12226052582263947, 0.131022110581398, 0.13978369534015656, 0.1485452950000763, 0.15730687975883484, 0.16606846451759338, 0.17483004927635193, 0.18359163403511047, 0.19235321879386902, 0.20111480355262756, 0.2098763883113861, 0.21863797307014465, 0.2273995727300644, 0.23616115748882294, 0.24492274224758148, 0.2536843419075012, 0.26244592666625977, 0.2712075114250183, 0.27996909618377686, 0.2887306809425354, 0.29749226570129395, 0.3062538504600525, 0.31501543521881104, 0.32377704977989197, 0.3325386047363281, 0.34130018949508667, 0.3500617742538452, 0.35882335901260376, 0.3675849437713623, 0.37634652853012085, 0.3851081132888794, 0.3938697278499603, 0.40263131260871887, 0.4113928973674774, 0.42015448212623596, 0.4289160668849945, 0.43767765164375305, 0.446439266204834, 0.45520085096359253, 0.4639624357223511, 0.4727240204811096]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 7.0, 7.0, 11.0, 24.0, 22.0, 33.0, 15.0, 41.0, 38.0, 42.0, 47.0, 47.0, 51.0, 51.0, 68.0, 47.0, 55.0, 53.0, 46.0, 51.0, 41.0, 34.0, 34.0, 30.0, 18.0, 20.0, 16.0, 9.0, 10.0, 6.0, 5.0, 3.0, 2.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.0587925910949707, -0.05727876350283623, -0.05576493591070175, -0.05425110459327698, -0.0527372770011425, -0.051223449409008026, -0.04970961809158325, -0.048195790499448776, -0.0466819629073143, -0.045168135315179825, -0.04365430772304535, -0.042140476405620575, -0.0406266488134861, -0.039112821221351624, -0.03759898990392685, -0.036085162311792374, -0.0345713347196579, -0.03305750712752342, -0.03154367953538895, -0.030029848217964172, -0.028516020625829697, -0.02700219303369522, -0.025488363578915596, -0.02397453412413597, -0.022460706532001495, -0.02094687893986702, -0.019433049485087395, -0.01791922003030777, -0.016405392438173294, -0.014891563914716244, -0.013377735391259193, -0.011863906867802143, -0.010350078344345093, -0.008836249820888042, -0.007322421297430992, -0.005808592773973942, -0.0042947642505168915, -0.002780935727059841, -0.0012671072036027908, 0.0002467213198542595, 0.0017605498433113098, 0.00327437836676836, 0.0047882068902254105, 0.006302035413682461, 0.007815863937139511, 0.009329692460596561, 0.010843520984053612, 0.012357349507510662, 0.013871178030967712, 0.015385006554424763, 0.016898835077881813, 0.018412664532661438, 0.019926492124795914, 0.02144031971693039, 0.022954149171710014, 0.02446797862648964, 0.025981806218624115, 0.02749563381075859, 0.029009463265538216, 0.03052329272031784, 0.032037120312452316, 0.03355094790458679, 0.035064779222011566, 0.03657860681414604, 0.03809243440628052]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 10.0, 8.0, 14.0, 15.0, 36.0, 60.0, 103.0, 162.0, 305.0, 545.0, 1085.0, 3635.0, 10355.0, 877198.0, 3279855.0, 15663.0, 2881.0, 965.0, 490.0, 328.0, 190.0, 131.0, 83.0, 55.0, 41.0, 21.0, 17.0, 14.0, 9.0, 1.0, 5.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0299530029296875, -0.02870965003967285, -0.027466297149658203, -0.026222944259643555, -0.024979591369628906, -0.023736238479614258, -0.02249288558959961, -0.02124953269958496, -0.020006179809570312, -0.018762826919555664, -0.017519474029541016, -0.016276121139526367, -0.015032768249511719, -0.01378941535949707, -0.012546062469482422, -0.011302709579467773, -0.010059356689453125, -0.008816003799438477, -0.007572650909423828, -0.00632929801940918, -0.005085945129394531, -0.003842592239379883, -0.0025992393493652344, -0.001355886459350586, -0.0001125335693359375, 0.001130819320678711, 0.0023741722106933594, 0.003617525100708008, 0.004860877990722656, 0.006104230880737305, 0.007347583770751953, 0.008590936660766602, 0.00983428955078125, 0.011077642440795898, 0.012320995330810547, 0.013564348220825195, 0.014807701110839844, 0.016051054000854492, 0.01729440689086914, 0.01853775978088379, 0.019781112670898438, 0.021024465560913086, 0.022267818450927734, 0.023511171340942383, 0.02475452423095703, 0.02599787712097168, 0.027241230010986328, 0.028484582901000977, 0.029727935791015625, 0.030971288681030273, 0.03221464157104492, 0.03345799446105957, 0.03470134735107422, 0.03594470024108887, 0.037188053131103516, 0.038431406021118164, 0.03967475891113281, 0.04091811180114746, 0.04216146469116211, 0.04340481758117676, 0.044648170471191406, 0.045891523361206055, 0.0471348762512207, 0.04837822914123535, 0.04962158203125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 23.0, 83.0, 168.0, 232.0, 242.0, 158.0, 67.0, 19.0, 4.0, 2.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.017822265625, -0.0172271728515625, -0.016632080078125, -0.0160369873046875, -0.01544189453125, -0.0148468017578125, -0.014251708984375, -0.0136566162109375, -0.0130615234375, -0.0124664306640625, -0.011871337890625, -0.0112762451171875, -0.01068115234375, -0.0100860595703125, -0.009490966796875, -0.0088958740234375, -0.00830078125, -0.0077056884765625, -0.007110595703125, -0.0065155029296875, -0.00592041015625, -0.0053253173828125, -0.004730224609375, -0.0041351318359375, -0.0035400390625, -0.0029449462890625, -0.002349853515625, -0.0017547607421875, -0.00115966796875, -0.0005645751953125, 3.0517578125e-05, 0.0006256103515625, 0.001220703125, 0.0018157958984375, 0.002410888671875, 0.0030059814453125, 0.00360107421875, 0.0041961669921875, 0.004791259765625, 0.0053863525390625, 0.0059814453125, 0.0065765380859375, 0.007171630859375, 0.0077667236328125, 0.00836181640625, 0.0089569091796875, 0.009552001953125, 0.0101470947265625, 0.0107421875, 0.0113372802734375, 0.011932373046875, 0.0125274658203125, 0.01312255859375, 0.0137176513671875, 0.014312744140625, 0.0149078369140625, 0.0155029296875, 0.0160980224609375, 0.016693115234375, 0.0172882080078125, 0.01788330078125, 0.0184783935546875, 0.019073486328125, 0.0196685791015625, 0.020263671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 7.0, 2.0, 3.0, 10.0, 9.0, 16.0, 18.0, 24.0, 60.0, 75.0, 110.0, 151.0, 347.0, 744.0, 2591.0, 17151.0, 2792830.0, 1362892.0, 13617.0, 2254.0, 670.0, 285.0, 151.0, 89.0, 52.0, 32.0, 26.0, 23.0, 13.0, 8.0, 9.0, 3.0, 3.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03533935546875, -0.03426694869995117, -0.033194541931152344, -0.032122135162353516, -0.031049728393554688, -0.02997732162475586, -0.02890491485595703, -0.027832508087158203, -0.026760101318359375, -0.025687694549560547, -0.02461528778076172, -0.02354288101196289, -0.022470474243164062, -0.021398067474365234, -0.020325660705566406, -0.019253253936767578, -0.01818084716796875, -0.017108440399169922, -0.016036033630371094, -0.014963626861572266, -0.013891220092773438, -0.01281881332397461, -0.011746406555175781, -0.010673999786376953, -0.009601593017578125, -0.008529186248779297, -0.007456779479980469, -0.006384372711181641, -0.0053119659423828125, -0.004239559173583984, -0.0031671524047851562, -0.002094745635986328, -0.0010223388671875, 5.0067901611328125e-05, 0.0011224746704101562, 0.0021948814392089844, 0.0032672882080078125, 0.004339694976806641, 0.005412101745605469, 0.006484508514404297, 0.007556915283203125, 0.008629322052001953, 0.009701728820800781, 0.01077413558959961, 0.011846542358398438, 0.012918949127197266, 0.013991355895996094, 0.015063762664794922, 0.01613616943359375, 0.017208576202392578, 0.018280982971191406, 0.019353389739990234, 0.020425796508789062, 0.02149820327758789, 0.02257061004638672, 0.023643016815185547, 0.024715423583984375, 0.025787830352783203, 0.02686023712158203, 0.02793264389038086, 0.029005050659179688, 0.030077457427978516, 0.031149864196777344, 0.03222227096557617, 0.033294677734375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 4.0, 8.0, 10.0, 21.0, 13.0, 25.0, 25.0, 54.0, 56.0, 89.0, 111.0, 173.0, 261.0, 407.0, 621.0, 597.0, 505.0, 298.0, 223.0, 141.0, 125.0, 76.0, 53.0, 45.0, 37.0, 25.0, 21.0, 10.0, 6.0, 2.0, 3.0, 4.0, 3.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00888824462890625, -0.008593559265136719, -0.008298873901367188, -0.008004188537597656, -0.007709503173828125, -0.007414817810058594, -0.0071201324462890625, -0.006825447082519531, -0.00653076171875, -0.006236076354980469, -0.0059413909912109375, -0.005646705627441406, -0.005352020263671875, -0.005057334899902344, -0.0047626495361328125, -0.004467964172363281, -0.00417327880859375, -0.0038785934448242188, -0.0035839080810546875, -0.0032892227172851562, -0.002994537353515625, -0.0026998519897460938, -0.0024051666259765625, -0.0021104812622070312, -0.0018157958984375, -0.0015211105346679688, -0.0012264251708984375, -0.0009317398071289062, -0.000637054443359375, -0.00034236907958984375, -4.76837158203125e-05, 0.00024700164794921875, 0.00054168701171875, 0.0008363723754882812, 0.0011310577392578125, 0.0014257431030273438, 0.001720428466796875, 0.0020151138305664062, 0.0023097991943359375, 0.0026044845581054688, 0.002899169921875, 0.0031938552856445312, 0.0034885406494140625, 0.0037832260131835938, 0.004077911376953125, 0.004372596740722656, 0.0046672821044921875, 0.004961967468261719, 0.00525665283203125, 0.005551338195800781, 0.0058460235595703125, 0.006140708923339844, 0.006435394287109375, 0.006730079650878906, 0.0070247650146484375, 0.007319450378417969, 0.0076141357421875, 0.007908821105957031, 0.008203506469726562, 0.008498191833496094, 0.008792877197265625, 0.009087562561035156, 0.009382247924804688, 0.009676933288574219, 0.00997161865234375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 27.0, 71.0, 247.0, 347.0, 192.0, 67.0, 29.0, 9.0, 1.0, 6.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.14066481590270996, -0.13717256486415863, -0.1336803138256073, -0.13018806278705597, -0.12669581174850464, -0.12320356070995331, -0.11971130967140198, -0.11621905863285065, -0.11272680759429932, -0.10923455655574799, -0.10574230551719666, -0.10225005447864532, -0.098757803440094, -0.09526555240154266, -0.09177330136299133, -0.08828105032444, -0.08478880673646927, -0.08129655569791794, -0.07780430465936661, -0.07431205362081528, -0.07081980258226395, -0.06732755154371262, -0.06383530795574188, -0.06034305319190025, -0.05685080215334892, -0.05335855111479759, -0.04986630007624626, -0.04637405276298523, -0.0428818017244339, -0.03938955068588257, -0.03589729964733124, -0.03240504860877991, -0.02891279011964798, -0.02542053908109665, -0.02192828804254532, -0.018436038866639137, -0.014943787828087807, -0.011451536789536476, -0.007959287613630295, -0.004467036575078964, -0.0009747855365276337, 0.0025174650363624096, 0.006009715609252453, 0.009501965716481209, 0.01299421675503254, 0.01648646779358387, 0.01997871696949005, 0.023470968008041382, 0.026963219046592712, 0.030455470085144043, 0.033947721123695374, 0.037439972162246704, 0.040932223200798035, 0.044424474239349365, 0.0479167215526104, 0.05140897259116173, 0.05490122362971306, 0.05839347466826439, 0.06188572570681572, 0.06537797302007675, 0.06887022405862808, 0.07236247509717941, 0.07585472613573074, 0.07934697717428207, 0.0828392282128334]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 9.0, 8.0, 19.0, 22.0, 23.0, 38.0, 45.0, 52.0, 66.0, 78.0, 69.0, 67.0, 71.0, 65.0, 69.0, 48.0, 41.0, 45.0, 42.0, 39.0, 28.0, 17.0, 15.0, 6.0, 8.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046460628509521484, -0.045007091015577316, -0.04355355352163315, -0.04210001602768898, -0.04064647853374481, -0.039192941039800644, -0.037739403545856476, -0.03628586605191231, -0.03483232855796814, -0.03337879106402397, -0.0319252535700798, -0.030471716076135635, -0.029018178582191467, -0.0275646410882473, -0.02611110359430313, -0.024657566100358963, -0.023204028606414795, -0.021750491112470627, -0.02029695361852646, -0.01884341612458229, -0.017389878630638123, -0.015936341136693954, -0.014482803642749786, -0.013029266148805618, -0.01157572865486145, -0.010122191160917282, -0.008668653666973114, -0.007215116173028946, -0.005761578679084778, -0.00430804118514061, -0.0028545036911964417, -0.0014009661972522736, 5.257129669189453e-05, 0.0015061087906360626, 0.0029596462845802307, 0.004413183778524399, 0.005866721272468567, 0.007320258766412735, 0.008773796260356903, 0.010227333754301071, 0.01168087124824524, 0.013134408742189407, 0.014587946236133575, 0.016041483730077744, 0.01749502122402191, 0.01894855871796608, 0.020402096211910248, 0.021855633705854416, 0.023309171199798584, 0.024762708693742752, 0.02621624618768692, 0.027669783681631088, 0.029123321175575256, 0.030576858669519424, 0.03203039616346359, 0.03348393365740776, 0.03493747115135193, 0.0363910086452961, 0.037844546139240265, 0.03929808363318443, 0.0407516211271286, 0.04220515862107277, 0.04365869611501694, 0.045112233608961105, 0.04656577110290527]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 3.0, 1.0, 5.0, 16.0, 2.0, 8.0, 11.0, 16.0, 17.0, 26.0, 24.0, 40.0, 50.0, 73.0, 101.0, 122.0, 180.0, 235.0, 303.0, 439.0, 641.0, 1030.0, 2527.0, 13713.0, 277570.0, 709128.0, 34325.0, 3989.0, 1302.0, 720.0, 540.0, 352.0, 234.0, 215.0, 150.0, 104.0, 86.0, 68.0, 53.0, 36.0, 24.0, 21.0, 14.0, 10.0, 12.0, 11.0, 10.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.04833984375, -0.047003746032714844, -0.04566764831542969, -0.04433155059814453, -0.042995452880859375, -0.04165935516357422, -0.04032325744628906, -0.038987159729003906, -0.03765106201171875, -0.036314964294433594, -0.03497886657714844, -0.03364276885986328, -0.032306671142578125, -0.03097057342529297, -0.029634475708007812, -0.028298377990722656, -0.0269622802734375, -0.025626182556152344, -0.024290084838867188, -0.02295398712158203, -0.021617889404296875, -0.02028179168701172, -0.018945693969726562, -0.017609596252441406, -0.01627349853515625, -0.014937400817871094, -0.013601303100585938, -0.012265205383300781, -0.010929107666015625, -0.009593009948730469, -0.008256912231445312, -0.006920814514160156, -0.005584716796875, -0.004248619079589844, -0.0029125213623046875, -0.0015764236450195312, -0.000240325927734375, 0.0010957717895507812, 0.0024318695068359375, 0.0037679672241210938, 0.00510406494140625, 0.006440162658691406, 0.0077762603759765625, 0.009112358093261719, 0.010448455810546875, 0.011784553527832031, 0.013120651245117188, 0.014456748962402344, 0.0157928466796875, 0.017128944396972656, 0.018465042114257812, 0.01980113983154297, 0.021137237548828125, 0.02247333526611328, 0.023809432983398438, 0.025145530700683594, 0.02648162841796875, 0.027817726135253906, 0.029153823852539062, 0.03048992156982422, 0.031826019287109375, 0.03316211700439453, 0.03449821472167969, 0.035834312438964844, 0.03717041015625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 7.0, 19.0, 74.0, 193.0, 246.0, 257.0, 154.0, 35.0, 11.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.017822265625, -0.017203807830810547, -0.016585350036621094, -0.01596689224243164, -0.015348434448242188, -0.014729976654052734, -0.014111518859863281, -0.013493061065673828, -0.012874603271484375, -0.012256145477294922, -0.011637687683105469, -0.011019229888916016, -0.010400772094726562, -0.00978231430053711, -0.009163856506347656, -0.008545398712158203, -0.00792694091796875, -0.007308483123779297, -0.006690025329589844, -0.006071567535400391, -0.0054531097412109375, -0.004834651947021484, -0.004216194152832031, -0.003597736358642578, -0.002979278564453125, -0.002360820770263672, -0.0017423629760742188, -0.0011239051818847656, -0.0005054473876953125, 0.00011301040649414062, 0.0007314682006835938, 0.0013499259948730469, 0.0019683837890625, 0.002586841583251953, 0.0032052993774414062, 0.0038237571716308594, 0.0044422149658203125, 0.005060672760009766, 0.005679130554199219, 0.006297588348388672, 0.006916046142578125, 0.007534503936767578, 0.008152961730957031, 0.008771419525146484, 0.009389877319335938, 0.01000833511352539, 0.010626792907714844, 0.011245250701904297, 0.01186370849609375, 0.012482166290283203, 0.013100624084472656, 0.01371908187866211, 0.014337539672851562, 0.014955997467041016, 0.015574455261230469, 0.016192913055419922, 0.016811370849609375, 0.017429828643798828, 0.01804828643798828, 0.018666744232177734, 0.019285202026367188, 0.01990365982055664, 0.020522117614746094, 0.021140575408935547, 0.021759033203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 4.0, 4.0, 10.0, 13.0, 14.0, 11.0, 22.0, 37.0, 37.0, 53.0, 97.0, 120.0, 207.0, 293.0, 489.0, 764.0, 1500.0, 3957.0, 15112.0, 97306.0, 629217.0, 256204.0, 31643.0, 6627.0, 2232.0, 932.0, 549.0, 356.0, 220.0, 146.0, 109.0, 70.0, 59.0, 41.0, 26.0, 21.0, 16.0, 9.0, 11.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.024017333984375, -0.023209095001220703, -0.022400856018066406, -0.02159261703491211, -0.020784378051757812, -0.019976139068603516, -0.01916790008544922, -0.018359661102294922, -0.017551422119140625, -0.016743183135986328, -0.01593494415283203, -0.015126705169677734, -0.014318466186523438, -0.01351022720336914, -0.012701988220214844, -0.011893749237060547, -0.01108551025390625, -0.010277271270751953, -0.009469032287597656, -0.00866079330444336, -0.007852554321289062, -0.007044315338134766, -0.006236076354980469, -0.005427837371826172, -0.004619598388671875, -0.003811359405517578, -0.0030031204223632812, -0.0021948814392089844, -0.0013866424560546875, -0.0005784034729003906, 0.00022983551025390625, 0.0010380744934082031, 0.0018463134765625, 0.002654552459716797, 0.0034627914428710938, 0.004271030426025391, 0.0050792694091796875, 0.005887508392333984, 0.006695747375488281, 0.007503986358642578, 0.008312225341796875, 0.009120464324951172, 0.009928703308105469, 0.010736942291259766, 0.011545181274414062, 0.01235342025756836, 0.013161659240722656, 0.013969898223876953, 0.01477813720703125, 0.015586376190185547, 0.016394615173339844, 0.01720285415649414, 0.018011093139648438, 0.018819332122802734, 0.01962757110595703, 0.020435810089111328, 0.021244049072265625, 0.022052288055419922, 0.02286052703857422, 0.023668766021728516, 0.024477005004882812, 0.02528524398803711, 0.026093482971191406, 0.026901721954345703, 0.0277099609375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 13.0, 10.0, 7.0, 11.0, 9.0, 20.0, 17.0, 18.0, 27.0, 25.0, 33.0, 25.0, 30.0, 40.0, 52.0, 45.0, 44.0, 40.0, 41.0, 38.0, 37.0, 28.0, 40.0, 34.0, 35.0, 45.0, 31.0, 25.0, 34.0, 22.0, 14.0, 22.0, 17.0, 12.0, 12.0, 7.0, 10.0, 2.0, 11.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.01218414306640625, -0.011808991432189941, -0.011433839797973633, -0.011058688163757324, -0.010683536529541016, -0.010308384895324707, -0.009933233261108398, -0.00955808162689209, -0.009182929992675781, -0.008807778358459473, -0.008432626724243164, -0.008057475090026855, -0.007682323455810547, -0.007307171821594238, -0.00693202018737793, -0.006556868553161621, -0.0061817169189453125, -0.005806565284729004, -0.005431413650512695, -0.005056262016296387, -0.004681110382080078, -0.0043059587478637695, -0.003930807113647461, -0.0035556554794311523, -0.0031805038452148438, -0.002805352210998535, -0.0024302005767822266, -0.002055048942565918, -0.0016798973083496094, -0.0013047456741333008, -0.0009295940399169922, -0.0005544424057006836, -0.000179290771484375, 0.0001958608627319336, 0.0005710124969482422, 0.0009461641311645508, 0.0013213157653808594, 0.001696467399597168, 0.0020716190338134766, 0.002446770668029785, 0.0028219223022460938, 0.0031970739364624023, 0.003572225570678711, 0.0039473772048950195, 0.004322528839111328, 0.004697680473327637, 0.005072832107543945, 0.005447983741760254, 0.0058231353759765625, 0.006198287010192871, 0.00657343864440918, 0.006948590278625488, 0.007323741912841797, 0.0076988935470581055, 0.008074045181274414, 0.008449196815490723, 0.008824348449707031, 0.00919950008392334, 0.009574651718139648, 0.009949803352355957, 0.010324954986572266, 0.010700106620788574, 0.011075258255004883, 0.011450409889221191, 0.0118255615234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 4.0, 5.0, 11.0, 19.0, 22.0, 31.0, 44.0, 68.0, 145.0, 225.0, 409.0, 967.0, 2505.0, 8571.0, 42659.0, 560637.0, 388645.0, 32633.0, 7108.0, 2125.0, 852.0, 368.0, 202.0, 102.0, 53.0, 41.0, 25.0, 26.0, 10.0, 13.0, 5.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01122283935546875, -0.010820984840393066, -0.010419130325317383, -0.0100172758102417, -0.009615421295166016, -0.009213566780090332, -0.008811712265014648, -0.008409857749938965, -0.008008003234863281, -0.007606148719787598, -0.007204294204711914, -0.0068024396896362305, -0.006400585174560547, -0.005998730659484863, -0.00559687614440918, -0.005195021629333496, -0.0047931671142578125, -0.004391312599182129, -0.003989458084106445, -0.0035876035690307617, -0.003185749053955078, -0.0027838945388793945, -0.002382040023803711, -0.0019801855087280273, -0.0015783309936523438, -0.0011764764785766602, -0.0007746219635009766, -0.00037276744842529297, 2.9087066650390625e-05, 0.0004309415817260742, 0.0008327960968017578, 0.0012346506118774414, 0.001636505126953125, 0.0020383596420288086, 0.002440214157104492, 0.0028420686721801758, 0.0032439231872558594, 0.003645777702331543, 0.0040476322174072266, 0.00444948673248291, 0.004851341247558594, 0.005253195762634277, 0.005655050277709961, 0.0060569047927856445, 0.006458759307861328, 0.006860613822937012, 0.007262468338012695, 0.007664322853088379, 0.008066177368164062, 0.008468031883239746, 0.00886988639831543, 0.009271740913391113, 0.009673595428466797, 0.01007544994354248, 0.010477304458618164, 0.010879158973693848, 0.011281013488769531, 0.011682868003845215, 0.012084722518920898, 0.012486577033996582, 0.012888431549072266, 0.01329028606414795, 0.013692140579223633, 0.014093995094299316, 0.014495849609375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 3.0, 4.0, 2.0, 4.0, 8.0, 7.0, 18.0, 15.0, 25.0, 40.0, 28.0, 56.0, 73.0, 88.0, 111.0, 102.0, 90.0, 77.0, 58.0, 45.0, 34.0, 34.0, 23.0, 15.0, 14.0, 5.0, 6.0, 7.0, 3.0, 3.0, 3.0, 2.0, 5.0, 2.0], "bins": [-0.00015151500701904297, -0.00014815572649240494, -0.0001447964459657669, -0.00014143716543912888, -0.00013807788491249084, -0.00013471860438585281, -0.00013135932385921478, -0.00012800004333257675, -0.00012464076280593872, -0.00012128148227930069, -0.00011792220175266266, -0.00011456292122602463, -0.0001112036406993866, -0.00010784436017274857, -0.00010448507964611053, -0.0001011257991194725, -9.776651859283447e-05, -9.440723806619644e-05, -9.104795753955841e-05, -8.768867701292038e-05, -8.432939648628235e-05, -8.097011595964432e-05, -7.761083543300629e-05, -7.425155490636826e-05, -7.089227437973022e-05, -6.75329938530922e-05, -6.417371332645416e-05, -6.081443279981613e-05, -5.74551522731781e-05, -5.409587174654007e-05, -5.073659121990204e-05, -4.737731069326401e-05, -4.4018030166625977e-05, -4.0658749639987946e-05, -3.7299469113349915e-05, -3.3940188586711884e-05, -3.058090806007385e-05, -2.722162753343582e-05, -2.386234700679779e-05, -2.050306648015976e-05, -1.714378595352173e-05, -1.3784505426883698e-05, -1.0425224900245667e-05, -7.0659443736076355e-06, -3.7066638469696045e-06, -3.473833203315735e-07, 3.0118972063064575e-06, 6.3711777329444885e-06, 9.73045825958252e-06, 1.308973878622055e-05, 1.644901931285858e-05, 1.9808299839496613e-05, 2.3167580366134644e-05, 2.6526860892772675e-05, 2.9886141419410706e-05, 3.3245421946048737e-05, 3.660470247268677e-05, 3.99639829993248e-05, 4.332326352596283e-05, 4.668254405260086e-05, 5.004182457923889e-05, 5.340110510587692e-05, 5.6760385632514954e-05, 6.0119666159152985e-05, 6.347894668579102e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 6.0, 4.0, 10.0, 10.0, 9.0, 16.0, 17.0, 28.0, 33.0, 36.0, 64.0, 92.0, 135.0, 218.0, 508.0, 1497.0, 6852.0, 60354.0, 877746.0, 88860.0, 8861.0, 1808.0, 592.0, 299.0, 163.0, 105.0, 72.0, 48.0, 31.0, 24.0, 19.0, 11.0, 8.0, 7.0, 8.0, 4.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016265869140625, -0.015781283378601074, -0.015296697616577148, -0.014812111854553223, -0.014327526092529297, -0.013842940330505371, -0.013358354568481445, -0.01287376880645752, -0.012389183044433594, -0.011904597282409668, -0.011420011520385742, -0.010935425758361816, -0.01045083999633789, -0.009966254234313965, -0.009481668472290039, -0.008997082710266113, -0.008512496948242188, -0.008027911186218262, -0.007543325424194336, -0.00705873966217041, -0.006574153900146484, -0.006089568138122559, -0.005604982376098633, -0.005120396614074707, -0.004635810852050781, -0.0041512250900268555, -0.0036666393280029297, -0.003182053565979004, -0.002697467803955078, -0.0022128820419311523, -0.0017282962799072266, -0.0012437105178833008, -0.000759124755859375, -0.0002745389938354492, 0.00021004676818847656, 0.0006946325302124023, 0.0011792182922363281, 0.001663804054260254, 0.0021483898162841797, 0.0026329755783081055, 0.0031175613403320312, 0.003602147102355957, 0.004086732864379883, 0.004571318626403809, 0.005055904388427734, 0.00554049015045166, 0.006025075912475586, 0.006509661674499512, 0.0069942474365234375, 0.007478833198547363, 0.007963418960571289, 0.008448004722595215, 0.00893259048461914, 0.009417176246643066, 0.009901762008666992, 0.010386347770690918, 0.010870933532714844, 0.01135551929473877, 0.011840105056762695, 0.012324690818786621, 0.012809276580810547, 0.013293862342834473, 0.013778448104858398, 0.014263033866882324, 0.01474761962890625]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 2.0, 2.0, 8.0, 5.0, 6.0, 15.0, 13.0, 14.0, 16.0, 32.0, 33.0, 48.0, 65.0, 110.0, 123.0, 144.0, 108.0, 68.0, 50.0, 33.0, 20.0, 12.0, 11.0, 8.0, 5.0, 6.0, 6.0, 4.0, 4.0, 3.0, 6.0, 4.0, 2.0, 2.0, 0.0, 5.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00505828857421875, -0.004864096641540527, -0.004669904708862305, -0.004475712776184082, -0.004281520843505859, -0.004087328910827637, -0.003893136978149414, -0.0036989450454711914, -0.0035047531127929688, -0.003310561180114746, -0.0031163692474365234, -0.0029221773147583008, -0.002727985382080078, -0.0025337934494018555, -0.002339601516723633, -0.00214540958404541, -0.0019512176513671875, -0.0017570257186889648, -0.0015628337860107422, -0.0013686418533325195, -0.0011744499206542969, -0.0009802579879760742, -0.0007860660552978516, -0.0005918741226196289, -0.00039768218994140625, -0.0002034902572631836, -9.298324584960938e-06, 0.00018489360809326172, 0.0003790855407714844, 0.000573277473449707, 0.0007674694061279297, 0.0009616613388061523, 0.001155853271484375, 0.0013500452041625977, 0.0015442371368408203, 0.001738429069519043, 0.0019326210021972656, 0.0021268129348754883, 0.002321004867553711, 0.0025151968002319336, 0.0027093887329101562, 0.002903580665588379, 0.0030977725982666016, 0.0032919645309448242, 0.003486156463623047, 0.0036803483963012695, 0.003874540328979492, 0.004068732261657715, 0.0042629241943359375, 0.00445711612701416, 0.004651308059692383, 0.0048454999923706055, 0.005039691925048828, 0.005233883857727051, 0.0054280757904052734, 0.005622267723083496, 0.005816459655761719, 0.006010651588439941, 0.006204843521118164, 0.006399035453796387, 0.006593227386474609, 0.006787419319152832, 0.006981611251831055, 0.007175803184509277, 0.0073699951171875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 31.0, 384.0, 513.0, 57.0, 11.0, 6.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27292537689208984, -0.2628140151500702, -0.25270265340805054, -0.2425912618637085, -0.23247990012168884, -0.2223685383796692, -0.21225716173648834, -0.2021457850933075, -0.19203442335128784, -0.1819230616092682, -0.17181168496608734, -0.1617003083229065, -0.15158894658088684, -0.1414775848388672, -0.13136620819568634, -0.12125483900308609, -0.11114346981048584, -0.10103210061788559, -0.09092073142528534, -0.08080936223268509, -0.07069799304008484, -0.06058662384748459, -0.05047525465488434, -0.04036388546228409, -0.030252516269683838, -0.020141147077083588, -0.010029777884483337, 8.159130811691284e-05, 0.010192960500717163, 0.020304329693317413, 0.030415698885917664, 0.040527068078517914, 0.050638437271118164, 0.060749806463718414, 0.07086117565631866, 0.08097254484891891, 0.09108391404151917, 0.10119528323411942, 0.11130665242671967, 0.12141802161931992, 0.13152939081192017, 0.14164075255393982, 0.15175212919712067, 0.1618635058403015, 0.17197486758232117, 0.18208622932434082, 0.19219760596752167, 0.20230898261070251, 0.21242034435272217, 0.22253170609474182, 0.23264308273792267, 0.24275445938110352, 0.25286582112312317, 0.2629771828651428, 0.27308857440948486, 0.2831999361515045, 0.29331129789352417, 0.3034226596355438, 0.3135340213775635, 0.3236454129219055, 0.33375677466392517, 0.3438681364059448, 0.35397952795028687, 0.3640908896923065, 0.37420225143432617]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 7.0, 6.0, 9.0, 8.0, 12.0, 14.0, 20.0, 26.0, 27.0, 28.0, 38.0, 30.0, 46.0, 36.0, 49.0, 51.0, 60.0, 63.0, 56.0, 50.0, 48.0, 53.0, 50.0, 43.0, 36.0, 37.0, 35.0, 16.0, 14.0, 10.0, 7.0, 4.0, 6.0, 6.0, 4.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06178915500640869, -0.05994928628206253, -0.05810941383242607, -0.05626954138278961, -0.05442967265844345, -0.05258980393409729, -0.05074993148446083, -0.04891005903482437, -0.04707019031047821, -0.04523032158613205, -0.04339044913649559, -0.04155057668685913, -0.03971070796251297, -0.03787083923816681, -0.03603096678853035, -0.03419109433889389, -0.03235122561454773, -0.03051135502755642, -0.02867148444056511, -0.0268316138535738, -0.02499174326658249, -0.02315187267959118, -0.02131200209259987, -0.01947213150560856, -0.01763226091861725, -0.01579239033162594, -0.013952519744634628, -0.012112649157643318, -0.010272778570652008, -0.008432907983660698, -0.006593037396669388, -0.004753166809678078, -0.0029132962226867676, -0.0010734256356954575, 0.0007664449512958527, 0.0026063155382871628, 0.004446186125278473, 0.006286056712269783, 0.008125927299261093, 0.009965797886252403, 0.011805668473243713, 0.013645539060235023, 0.015485409647226334, 0.017325280234217644, 0.019165150821208954, 0.021005021408200264, 0.022844891995191574, 0.024684762582182884, 0.026524633169174194, 0.028364503756165504, 0.030204374343156815, 0.032044246792793274, 0.033884115517139435, 0.035723984241485596, 0.037563856691122055, 0.039403729140758514, 0.041243597865104675, 0.043083466589450836, 0.044923339039087296, 0.046763211488723755, 0.048603080213069916, 0.05044294893741608, 0.052282821387052536, 0.054122693836688995, 0.055962562561035156]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 2.0, 5.0, 4.0, 7.0, 13.0, 18.0, 22.0, 23.0, 43.0, 52.0, 98.0, 135.0, 204.0, 350.0, 529.0, 1251.0, 3119.0, 5223.0, 22479.0, 2291070.0, 1836239.0, 24562.0, 4886.0, 1889.0, 748.0, 382.0, 273.0, 193.0, 140.0, 93.0, 55.0, 45.0, 28.0, 23.0, 24.0, 16.0, 16.0, 6.0, 5.0, 2.0, 6.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0252838134765625, -0.02449321746826172, -0.023702621459960938, -0.022912025451660156, -0.022121429443359375, -0.021330833435058594, -0.020540237426757812, -0.01974964141845703, -0.01895904541015625, -0.01816844940185547, -0.017377853393554688, -0.016587257385253906, -0.015796661376953125, -0.015006065368652344, -0.014215469360351562, -0.013424873352050781, -0.01263427734375, -0.011843681335449219, -0.011053085327148438, -0.010262489318847656, -0.009471893310546875, -0.008681297302246094, -0.007890701293945312, -0.007100105285644531, -0.00630950927734375, -0.005518913269042969, -0.0047283172607421875, -0.003937721252441406, -0.003147125244140625, -0.0023565292358398438, -0.0015659332275390625, -0.0007753372192382812, 1.52587890625e-05, 0.0008058547973632812, 0.0015964508056640625, 0.0023870468139648438, 0.003177642822265625, 0.003968238830566406, 0.0047588348388671875, 0.005549430847167969, 0.00634002685546875, 0.007130622863769531, 0.007921218872070312, 0.008711814880371094, 0.009502410888671875, 0.010293006896972656, 0.011083602905273438, 0.011874198913574219, 0.012664794921875, 0.013455390930175781, 0.014245986938476562, 0.015036582946777344, 0.015827178955078125, 0.016617774963378906, 0.017408370971679688, 0.01819896697998047, 0.01898956298828125, 0.01978015899658203, 0.020570755004882812, 0.021361351013183594, 0.022151947021484375, 0.022942543029785156, 0.023733139038085938, 0.02452373504638672, 0.0253143310546875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 9.0, 38.0, 105.0, 187.0, 244.0, 225.0, 129.0, 41.0, 15.0, 4.0, 6.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.018463134765625, -0.01784038543701172, -0.017217636108398438, -0.016594886779785156, -0.015972137451171875, -0.015349388122558594, -0.014726638793945312, -0.014103889465332031, -0.01348114013671875, -0.012858390808105469, -0.012235641479492188, -0.011612892150878906, -0.010990142822265625, -0.010367393493652344, -0.009744644165039062, -0.009121894836425781, -0.0084991455078125, -0.007876396179199219, -0.0072536468505859375, -0.006630897521972656, -0.006008148193359375, -0.005385398864746094, -0.0047626495361328125, -0.004139900207519531, -0.00351715087890625, -0.0028944015502929688, -0.0022716522216796875, -0.0016489028930664062, -0.001026153564453125, -0.00040340423583984375, 0.0002193450927734375, 0.0008420944213867188, 0.00146484375, 0.0020875930786132812, 0.0027103424072265625, 0.0033330917358398438, 0.003955841064453125, 0.004578590393066406, 0.0052013397216796875, 0.005824089050292969, 0.00644683837890625, 0.007069587707519531, 0.0076923370361328125, 0.008315086364746094, 0.008937835693359375, 0.009560585021972656, 0.010183334350585938, 0.010806083679199219, 0.0114288330078125, 0.012051582336425781, 0.012674331665039062, 0.013297080993652344, 0.013919830322265625, 0.014542579650878906, 0.015165328979492188, 0.01578807830810547, 0.01641082763671875, 0.01703357696533203, 0.017656326293945312, 0.018279075622558594, 0.018901824951171875, 0.019524574279785156, 0.020147323608398438, 0.02077007293701172, 0.021392822265625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 4.0, 5.0, 6.0, 14.0, 16.0, 9.0, 21.0, 36.0, 49.0, 87.0, 159.0, 282.0, 735.0, 2084.0, 9501.0, 116151.0, 3898505.0, 151940.0, 10989.0, 2273.0, 733.0, 288.0, 148.0, 88.0, 61.0, 38.0, 15.0, 16.0, 9.0, 3.0, 6.0, 3.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0237884521484375, -0.023034095764160156, -0.022279739379882812, -0.02152538299560547, -0.020771026611328125, -0.02001667022705078, -0.019262313842773438, -0.018507957458496094, -0.01775360107421875, -0.016999244689941406, -0.016244888305664062, -0.015490531921386719, -0.014736175537109375, -0.013981819152832031, -0.013227462768554688, -0.012473106384277344, -0.01171875, -0.010964393615722656, -0.010210037231445312, -0.009455680847167969, -0.008701324462890625, -0.007946968078613281, -0.0071926116943359375, -0.006438255310058594, -0.00568389892578125, -0.004929542541503906, -0.0041751861572265625, -0.0034208297729492188, -0.002666473388671875, -0.0019121170043945312, -0.0011577606201171875, -0.00040340423583984375, 0.0003509521484375, 0.0011053085327148438, 0.0018596649169921875, 0.0026140213012695312, 0.003368377685546875, 0.004122734069824219, 0.0048770904541015625, 0.005631446838378906, 0.00638580322265625, 0.007140159606933594, 0.007894515991210938, 0.008648872375488281, 0.009403228759765625, 0.010157585144042969, 0.010911941528320312, 0.011666297912597656, 0.012420654296875, 0.013175010681152344, 0.013929367065429688, 0.014683723449707031, 0.015438079833984375, 0.01619243621826172, 0.016946792602539062, 0.017701148986816406, 0.01845550537109375, 0.019209861755371094, 0.019964218139648438, 0.02071857452392578, 0.021472930908203125, 0.02222728729248047, 0.022981643676757812, 0.023736000061035156, 0.0244903564453125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 9.0, 10.0, 13.0, 24.0, 13.0, 26.0, 36.0, 49.0, 68.0, 90.0, 123.0, 248.0, 436.0, 807.0, 734.0, 499.0, 270.0, 166.0, 115.0, 80.0, 77.0, 34.0, 31.0, 23.0, 26.0, 12.0, 13.0, 10.0, 3.0, 9.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.00994873046875, -0.009656786918640137, -0.009364843368530273, -0.00907289981842041, -0.008780956268310547, -0.008489012718200684, -0.00819706916809082, -0.007905125617980957, -0.007613182067871094, -0.0073212385177612305, -0.007029294967651367, -0.006737351417541504, -0.006445407867431641, -0.006153464317321777, -0.005861520767211914, -0.005569577217102051, -0.0052776336669921875, -0.004985690116882324, -0.004693746566772461, -0.004401803016662598, -0.004109859466552734, -0.003817915916442871, -0.003525972366333008, -0.0032340288162231445, -0.0029420852661132812, -0.002650141716003418, -0.0023581981658935547, -0.0020662546157836914, -0.0017743110656738281, -0.0014823675155639648, -0.0011904239654541016, -0.0008984804153442383, -0.000606536865234375, -0.0003145933151245117, -2.2649765014648438e-05, 0.00026929378509521484, 0.0005612373352050781, 0.0008531808853149414, 0.0011451244354248047, 0.001437067985534668, 0.0017290115356445312, 0.0020209550857543945, 0.002312898635864258, 0.002604842185974121, 0.0028967857360839844, 0.0031887292861938477, 0.003480672836303711, 0.0037726163864135742, 0.0040645599365234375, 0.004356503486633301, 0.004648447036743164, 0.004940390586853027, 0.005232334136962891, 0.005524277687072754, 0.005816221237182617, 0.0061081647872924805, 0.006400108337402344, 0.006692051887512207, 0.00698399543762207, 0.007275938987731934, 0.007567882537841797, 0.00785982608795166, 0.008151769638061523, 0.008443713188171387, 0.00873565673828125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 12.0, 35.0, 219.0, 453.0, 227.0, 41.0, 4.0, 4.0, 4.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.1722070723772049, -0.16772635281085968, -0.16324561834335327, -0.15876489877700806, -0.15428416430950165, -0.14980344474315643, -0.14532271027565002, -0.1408419907093048, -0.1363612711429596, -0.13188055157661438, -0.12739981710910797, -0.12291909009218216, -0.11843836307525635, -0.11395764350891113, -0.10947691649198532, -0.10499618947505951, -0.1005154550075531, -0.09603472799062729, -0.09155400097370148, -0.08707327395677567, -0.08259254693984985, -0.07811182737350464, -0.07363110035657883, -0.06915037333965302, -0.0646696463227272, -0.06018891930580139, -0.05570819228887558, -0.051227468997240067, -0.046746741980314255, -0.04226601496338844, -0.03778529167175293, -0.03330456465482712, -0.028823837637901306, -0.024343110620975494, -0.019862385466694832, -0.015381659381091595, -0.010900933295488358, -0.006420206278562546, -0.0019394811242818832, 0.0025412440299987793, 0.007021971046924591, 0.011502697132527828, 0.015983423218131065, 0.020464148372411728, 0.02494487538933754, 0.02942560240626335, 0.033906325697898865, 0.038387052714824677, 0.04286777973175049, 0.0473485067486763, 0.05182923376560211, 0.056309957057237625, 0.06079068407416344, 0.06527140736579895, 0.06975213438272476, 0.07423286139965057, 0.07871358841657639, 0.0831943154335022, 0.08767504245042801, 0.09215576946735382, 0.09663648903369904, 0.10111722350120544, 0.10559794306755066, 0.11007867008447647, 0.11455939710140228]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 7.0, 11.0, 17.0, 24.0, 34.0, 33.0, 62.0, 44.0, 58.0, 68.0, 63.0, 61.0, 72.0, 78.0, 50.0, 58.0, 50.0, 43.0, 31.0, 28.0, 29.0, 15.0, 23.0, 8.0, 11.0, 8.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0522761344909668, -0.05100224167108536, -0.04972834885120392, -0.04845445230603218, -0.04718055948615074, -0.0459066666662693, -0.044632770121097565, -0.043358877301216125, -0.042084984481334686, -0.04081109166145325, -0.03953719884157181, -0.03826330229640007, -0.03698940947651863, -0.03571551665663719, -0.034441620111465454, -0.033167727291584015, -0.031893834471702576, -0.030619941651821136, -0.029346046969294548, -0.02807215228676796, -0.02679825946688652, -0.02552436664700508, -0.024250471964478493, -0.022976577281951904, -0.021702684462070465, -0.020428791642189026, -0.019154896959662437, -0.01788100227713585, -0.01660710945725441, -0.015333215706050396, -0.014059321954846382, -0.012785428203642368, -0.011511534452438354, -0.01023764070123434, -0.008963746950030327, -0.007689853198826313, -0.006415959447622299, -0.005142065696418285, -0.0038681719452142715, -0.0025942781940102577, -0.001320384442806244, -4.649069160223007e-05, 0.0012274030596017838, 0.0025012968108057976, 0.0037751905620098114, 0.005049084313213825, 0.006322978064417839, 0.007596871815621853, 0.008870765566825867, 0.01014465931802988, 0.011418553069233894, 0.012692446820437908, 0.013966340571641922, 0.015240234322845936, 0.01651412807404995, 0.017788022756576538, 0.019061915576457977, 0.020335808396339417, 0.021609703078866005, 0.022883597761392593, 0.024157490581274033, 0.025431383401155472, 0.02670527808368206, 0.02797917276620865, 0.029253065586090088]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 5.0, 9.0, 10.0, 21.0, 11.0, 29.0, 17.0, 38.0, 53.0, 49.0, 87.0, 106.0, 156.0, 193.0, 292.0, 431.0, 834.0, 1953.0, 9212.0, 259234.0, 750668.0, 19416.0, 2860.0, 1100.0, 568.0, 345.0, 224.0, 145.0, 123.0, 107.0, 70.0, 53.0, 30.0, 26.0, 21.0, 11.0, 11.0, 11.0, 10.0, 4.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.037200927734375, -0.036006927490234375, -0.03481292724609375, -0.033618927001953125, -0.0324249267578125, -0.031230926513671875, -0.03003692626953125, -0.028842926025390625, -0.02764892578125, -0.026454925537109375, -0.02526092529296875, -0.024066925048828125, -0.0228729248046875, -0.021678924560546875, -0.02048492431640625, -0.019290924072265625, -0.018096923828125, -0.016902923583984375, -0.01570892333984375, -0.014514923095703125, -0.0133209228515625, -0.012126922607421875, -0.01093292236328125, -0.009738922119140625, -0.008544921875, -0.007350921630859375, -0.00615692138671875, -0.004962921142578125, -0.0037689208984375, -0.002574920654296875, -0.00138092041015625, -0.000186920166015625, 0.001007080078125, 0.002201080322265625, 0.00339508056640625, 0.004589080810546875, 0.0057830810546875, 0.006977081298828125, 0.00817108154296875, 0.009365081787109375, 0.01055908203125, 0.011753082275390625, 0.01294708251953125, 0.014141082763671875, 0.0153350830078125, 0.016529083251953125, 0.01772308349609375, 0.018917083740234375, 0.020111083984375, 0.021305084228515625, 0.02249908447265625, 0.023693084716796875, 0.0248870849609375, 0.026081085205078125, 0.02727508544921875, 0.028469085693359375, 0.0296630859375, 0.030857086181640625, 0.03205108642578125, 0.033245086669921875, 0.0344390869140625, 0.035633087158203125, 0.03682708740234375, 0.038021087646484375, 0.039215087890625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 26.0, 81.0, 176.0, 244.0, 228.0, 158.0, 55.0, 18.0, 8.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0180511474609375, -0.01742696762084961, -0.01680278778076172, -0.016178607940673828, -0.015554428100585938, -0.014930248260498047, -0.014306068420410156, -0.013681888580322266, -0.013057708740234375, -0.012433528900146484, -0.011809349060058594, -0.011185169219970703, -0.010560989379882812, -0.009936809539794922, -0.009312629699707031, -0.00868844985961914, -0.00806427001953125, -0.007440090179443359, -0.006815910339355469, -0.006191730499267578, -0.0055675506591796875, -0.004943370819091797, -0.004319190979003906, -0.0036950111389160156, -0.003070831298828125, -0.0024466514587402344, -0.0018224716186523438, -0.0011982917785644531, -0.0005741119384765625, 5.0067901611328125e-05, 0.0006742477416992188, 0.0012984275817871094, 0.001922607421875, 0.0025467872619628906, 0.0031709671020507812, 0.003795146942138672, 0.0044193267822265625, 0.005043506622314453, 0.005667686462402344, 0.006291866302490234, 0.006916046142578125, 0.007540225982666016, 0.008164405822753906, 0.008788585662841797, 0.009412765502929688, 0.010036945343017578, 0.010661125183105469, 0.01128530502319336, 0.01190948486328125, 0.01253366470336914, 0.013157844543457031, 0.013782024383544922, 0.014406204223632812, 0.015030384063720703, 0.015654563903808594, 0.016278743743896484, 0.016902923583984375, 0.017527103424072266, 0.018151283264160156, 0.018775463104248047, 0.019399642944335938, 0.020023822784423828, 0.02064800262451172, 0.02127218246459961, 0.0218963623046875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 3.0, 10.0, 7.0, 13.0, 20.0, 38.0, 50.0, 51.0, 74.0, 137.0, 235.0, 368.0, 815.0, 2529.0, 13518.0, 267276.0, 723911.0, 32824.0, 4256.0, 1182.0, 503.0, 273.0, 158.0, 103.0, 69.0, 39.0, 26.0, 15.0, 9.0, 10.0, 8.0, 2.0, 7.0, 7.0, 5.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0307464599609375, -0.02979111671447754, -0.028835773468017578, -0.027880430221557617, -0.026925086975097656, -0.025969743728637695, -0.025014400482177734, -0.024059057235717773, -0.023103713989257812, -0.02214837074279785, -0.02119302749633789, -0.02023768424987793, -0.01928234100341797, -0.018326997756958008, -0.017371654510498047, -0.016416311264038086, -0.015460968017578125, -0.014505624771118164, -0.013550281524658203, -0.012594938278198242, -0.011639595031738281, -0.01068425178527832, -0.00972890853881836, -0.008773565292358398, -0.007818222045898438, -0.0068628787994384766, -0.005907535552978516, -0.004952192306518555, -0.003996849060058594, -0.003041505813598633, -0.002086162567138672, -0.001130819320678711, -0.00017547607421875, 0.0007798671722412109, 0.0017352104187011719, 0.002690553665161133, 0.0036458969116210938, 0.004601240158081055, 0.005556583404541016, 0.0065119266510009766, 0.0074672698974609375, 0.008422613143920898, 0.00937795639038086, 0.01033329963684082, 0.011288642883300781, 0.012243986129760742, 0.013199329376220703, 0.014154672622680664, 0.015110015869140625, 0.016065359115600586, 0.017020702362060547, 0.017976045608520508, 0.01893138885498047, 0.01988673210144043, 0.02084207534790039, 0.02179741859436035, 0.022752761840820312, 0.023708105087280273, 0.024663448333740234, 0.025618791580200195, 0.026574134826660156, 0.027529478073120117, 0.028484821319580078, 0.02944016456604004, 0.0303955078125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 3.0, 6.0, 2.0, 12.0, 8.0, 11.0, 8.0, 20.0, 22.0, 18.0, 23.0, 29.0, 31.0, 34.0, 51.0, 41.0, 45.0, 63.0, 43.0, 48.0, 50.0, 46.0, 42.0, 45.0, 43.0, 43.0, 41.0, 24.0, 26.0, 16.0, 17.0, 19.0, 16.0, 19.0, 7.0, 8.0, 8.0, 7.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01168060302734375, -0.011255979537963867, -0.010831356048583984, -0.010406732559204102, -0.009982109069824219, -0.009557485580444336, -0.009132862091064453, -0.00870823860168457, -0.008283615112304688, -0.007858991622924805, -0.007434368133544922, -0.007009744644165039, -0.006585121154785156, -0.0061604976654052734, -0.005735874176025391, -0.005311250686645508, -0.004886627197265625, -0.004462003707885742, -0.004037380218505859, -0.0036127567291259766, -0.0031881332397460938, -0.002763509750366211, -0.002338886260986328, -0.0019142627716064453, -0.0014896392822265625, -0.0010650157928466797, -0.0006403923034667969, -0.00021576881408691406, 0.00020885467529296875, 0.0006334781646728516, 0.0010581016540527344, 0.0014827251434326172, 0.0019073486328125, 0.002331972122192383, 0.0027565956115722656, 0.0031812191009521484, 0.0036058425903320312, 0.004030466079711914, 0.004455089569091797, 0.00487971305847168, 0.0053043365478515625, 0.005728960037231445, 0.006153583526611328, 0.006578207015991211, 0.007002830505371094, 0.0074274539947509766, 0.00785207748413086, 0.008276700973510742, 0.008701324462890625, 0.009125947952270508, 0.00955057144165039, 0.009975194931030273, 0.010399818420410156, 0.010824441909790039, 0.011249065399169922, 0.011673688888549805, 0.012098312377929688, 0.01252293586730957, 0.012947559356689453, 0.013372182846069336, 0.013796806335449219, 0.014221429824829102, 0.014646053314208984, 0.015070676803588867, 0.01549530029296875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 9.0, 11.0, 13.0, 21.0, 37.0, 38.0, 69.0, 102.0, 160.0, 311.0, 648.0, 1531.0, 4150.0, 14669.0, 86075.0, 706493.0, 199230.0, 24902.0, 6343.0, 1991.0, 813.0, 367.0, 202.0, 107.0, 78.0, 61.0, 26.0, 22.0, 21.0, 14.0, 9.0, 9.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007602691650390625, -0.007346451282501221, -0.007090210914611816, -0.006833970546722412, -0.006577730178833008, -0.0063214898109436035, -0.006065249443054199, -0.005809009075164795, -0.005552768707275391, -0.005296528339385986, -0.005040287971496582, -0.004784047603607178, -0.0045278072357177734, -0.004271566867828369, -0.004015326499938965, -0.0037590861320495605, -0.0035028457641601562, -0.003246605396270752, -0.0029903650283813477, -0.0027341246604919434, -0.002477884292602539, -0.0022216439247131348, -0.0019654035568237305, -0.0017091631889343262, -0.0014529228210449219, -0.0011966824531555176, -0.0009404420852661133, -0.000684201717376709, -0.0004279613494873047, -0.0001717209815979004, 8.45193862915039e-05, 0.0003407597541809082, 0.0005970001220703125, 0.0008532404899597168, 0.001109480857849121, 0.0013657212257385254, 0.0016219615936279297, 0.001878201961517334, 0.0021344423294067383, 0.0023906826972961426, 0.002646923065185547, 0.002903163433074951, 0.0031594038009643555, 0.0034156441688537598, 0.003671884536743164, 0.003928124904632568, 0.004184365272521973, 0.004440605640411377, 0.004696846008300781, 0.0049530863761901855, 0.00520932674407959, 0.005465567111968994, 0.0057218074798583984, 0.005978047847747803, 0.006234288215637207, 0.006490528583526611, 0.006746768951416016, 0.00700300931930542, 0.007259249687194824, 0.0075154900550842285, 0.007771730422973633, 0.008027970790863037, 0.008284211158752441, 0.008540451526641846, 0.00879669189453125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 4.0, 5.0, 3.0, 7.0, 10.0, 10.0, 7.0, 9.0, 11.0, 20.0, 16.0, 22.0, 18.0, 30.0, 31.0, 33.0, 48.0, 49.0, 64.0, 62.0, 78.0, 56.0, 58.0, 53.0, 45.0, 32.0, 31.0, 26.0, 24.0, 23.0, 23.0, 18.0, 20.0, 8.0, 12.0, 6.0, 3.0, 5.0, 4.0, 5.0, 2.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-4.786252975463867e-05, -4.6232715249061584e-05, -4.46029007434845e-05, -4.297308623790741e-05, -4.134327173233032e-05, -3.9713457226753235e-05, -3.808364272117615e-05, -3.645382821559906e-05, -3.482401371002197e-05, -3.3194199204444885e-05, -3.15643846988678e-05, -2.993457019329071e-05, -2.8304755687713623e-05, -2.6674941182136536e-05, -2.5045126676559448e-05, -2.341531217098236e-05, -2.1785497665405273e-05, -2.0155683159828186e-05, -1.85258686542511e-05, -1.689605414867401e-05, -1.5266239643096924e-05, -1.3636425137519836e-05, -1.2006610631942749e-05, -1.0376796126365662e-05, -8.746981620788574e-06, -7.117167115211487e-06, -5.487352609634399e-06, -3.857538104057312e-06, -2.2277235984802246e-06, -5.979090929031372e-07, 1.0319054126739502e-06, 2.6617199182510376e-06, 4.291534423828125e-06, 5.921348929405212e-06, 7.5511634349823e-06, 9.180977940559387e-06, 1.0810792446136475e-05, 1.2440606951713562e-05, 1.407042145729065e-05, 1.5700235962867737e-05, 1.7330050468444824e-05, 1.895986497402191e-05, 2.0589679479599e-05, 2.2219493985176086e-05, 2.3849308490753174e-05, 2.547912299633026e-05, 2.710893750190735e-05, 2.8738752007484436e-05, 3.0368566513061523e-05, 3.199838101863861e-05, 3.36281955242157e-05, 3.5258010029792786e-05, 3.688782453536987e-05, 3.851763904094696e-05, 4.014745354652405e-05, 4.1777268052101135e-05, 4.340708255767822e-05, 4.503689706325531e-05, 4.66667115688324e-05, 4.8296526074409485e-05, 4.992634057998657e-05, 5.155615508556366e-05, 5.318596959114075e-05, 5.4815784096717834e-05, 5.644559860229492e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 8.0, 5.0, 4.0, 9.0, 12.0, 18.0, 17.0, 20.0, 33.0, 55.0, 66.0, 130.0, 231.0, 446.0, 953.0, 2507.0, 7605.0, 34361.0, 372961.0, 565636.0, 48406.0, 9755.0, 3044.0, 1103.0, 491.0, 227.0, 148.0, 84.0, 59.0, 35.0, 32.0, 22.0, 17.0, 6.0, 10.0, 10.0, 4.0, 5.0, 5.0, 1.0, 4.0, 5.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00797271728515625, -0.007698655128479004, -0.007424592971801758, -0.007150530815124512, -0.006876468658447266, -0.0066024065017700195, -0.0063283443450927734, -0.006054282188415527, -0.005780220031738281, -0.005506157875061035, -0.005232095718383789, -0.004958033561706543, -0.004683971405029297, -0.004409909248352051, -0.004135847091674805, -0.0038617849349975586, -0.0035877227783203125, -0.0033136606216430664, -0.0030395984649658203, -0.0027655363082885742, -0.002491474151611328, -0.002217411994934082, -0.001943349838256836, -0.0016692876815795898, -0.0013952255249023438, -0.0011211633682250977, -0.0008471012115478516, -0.0005730390548706055, -0.0002989768981933594, -2.491474151611328e-05, 0.0002491474151611328, 0.0005232095718383789, 0.000797271728515625, 0.001071333885192871, 0.0013453960418701172, 0.0016194581985473633, 0.0018935203552246094, 0.0021675825119018555, 0.0024416446685791016, 0.0027157068252563477, 0.0029897689819335938, 0.00326383113861084, 0.003537893295288086, 0.003811955451965332, 0.004086017608642578, 0.004360079765319824, 0.00463414192199707, 0.004908204078674316, 0.0051822662353515625, 0.005456328392028809, 0.005730390548706055, 0.006004452705383301, 0.006278514862060547, 0.006552577018737793, 0.006826639175415039, 0.007100701332092285, 0.007374763488769531, 0.007648825645446777, 0.007922887802124023, 0.00819694995880127, 0.008471012115478516, 0.008745074272155762, 0.009019136428833008, 0.009293198585510254, 0.0095672607421875]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 6.0, 4.0, 6.0, 8.0, 6.0, 10.0, 12.0, 18.0, 17.0, 26.0, 33.0, 35.0, 56.0, 62.0, 66.0, 91.0, 74.0, 89.0, 70.0, 69.0, 51.0, 43.0, 24.0, 30.0, 21.0, 15.0, 14.0, 11.0, 11.0, 2.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00440216064453125, -0.004266858100891113, -0.0041315555572509766, -0.00399625301361084, -0.003860950469970703, -0.0037256479263305664, -0.0035903453826904297, -0.003455042839050293, -0.0033197402954101562, -0.0031844377517700195, -0.003049135208129883, -0.002913832664489746, -0.0027785301208496094, -0.0026432275772094727, -0.002507925033569336, -0.0023726224899291992, -0.0022373199462890625, -0.0021020174026489258, -0.001966714859008789, -0.0018314123153686523, -0.0016961097717285156, -0.001560807228088379, -0.0014255046844482422, -0.0012902021408081055, -0.0011548995971679688, -0.001019597053527832, -0.0008842945098876953, -0.0007489919662475586, -0.0006136894226074219, -0.00047838687896728516, -0.00034308433532714844, -0.00020778179168701172, -7.2479248046875e-05, 6.282329559326172e-05, 0.00019812583923339844, 0.00033342838287353516, 0.0004687309265136719, 0.0006040334701538086, 0.0007393360137939453, 0.000874638557434082, 0.0010099411010742188, 0.0011452436447143555, 0.0012805461883544922, 0.001415848731994629, 0.0015511512756347656, 0.0016864538192749023, 0.001821756362915039, 0.0019570589065551758, 0.0020923614501953125, 0.0022276639938354492, 0.002362966537475586, 0.0024982690811157227, 0.0026335716247558594, 0.002768874168395996, 0.002904176712036133, 0.0030394792556762695, 0.0031747817993164062, 0.003310084342956543, 0.0034453868865966797, 0.0035806894302368164, 0.003715991973876953, 0.00385129451751709, 0.0039865970611572266, 0.004121899604797363, 0.0042572021484375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 51.0, 895.0, 59.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13441069424152374, -0.11848713457584381, -0.10256357491016388, -0.08664000779390335, -0.07071644812822342, -0.05479288846254349, -0.03886932134628296, -0.022945761680603027, -0.007022202014923096, 0.008901359513401985, 0.024824921041727066, 0.040748484432697296, 0.05667204409837723, 0.07259560376405716, 0.08851917088031769, 0.10444273054599762, 0.12036629021167755, 0.13628984987735748, 0.15221340954303741, 0.16813698410987854, 0.18406054377555847, 0.1999841034412384, 0.21590766310691833, 0.23183122277259827, 0.2477547824382782, 0.26367834210395813, 0.27960190176963806, 0.295525461435318, 0.3114490211009979, 0.32737258076667786, 0.3432961702346802, 0.3592197299003601, 0.37514322996139526, 0.3910667896270752, 0.4069903492927551, 0.42291390895843506, 0.438837468624115, 0.4547610282897949, 0.47068458795547485, 0.4866081476211548, 0.5025317072868347, 0.5184552669525146, 0.5343788266181946, 0.5503023862838745, 0.5662259459495544, 0.5821495056152344, 0.5980730652809143, 0.6139966249465942, 0.629920244216919, 0.6458438038825989, 0.6617673635482788, 0.6776909232139587, 0.6936144828796387, 0.7095380425453186, 0.7254616022109985, 0.7413851618766785, 0.7573087215423584, 0.7732322812080383, 0.7891558408737183, 0.8050794005393982, 0.8210029602050781, 0.8369265198707581, 0.852850079536438, 0.8687736392021179, 0.8846971988677979]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 1.0, 3.0, 7.0, 3.0, 9.0, 12.0, 8.0, 13.0, 11.0, 16.0, 21.0, 23.0, 20.0, 30.0, 31.0, 44.0, 27.0, 47.0, 37.0, 44.0, 40.0, 40.0, 40.0, 57.0, 43.0, 37.0, 30.0, 45.0, 22.0, 45.0, 27.0, 18.0, 28.0, 16.0, 15.0, 20.0, 12.0, 16.0, 9.0, 6.0, 5.0, 7.0, 10.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.04222053289413452, -0.04105687886476517, -0.03989322483539581, -0.03872957080602646, -0.037565916776657104, -0.03640226274728775, -0.035238608717918396, -0.03407495468854904, -0.03291130065917969, -0.03174764662981033, -0.03058399260044098, -0.029420338571071625, -0.02825668454170227, -0.027093030512332916, -0.025929376482963562, -0.024765722453594208, -0.023602068424224854, -0.0224384143948555, -0.021274760365486145, -0.02011110633611679, -0.018947452306747437, -0.017783798277378082, -0.016620144248008728, -0.015456490218639374, -0.01429283618927002, -0.013129182159900665, -0.011965528130531311, -0.010801874101161957, -0.009638220071792603, -0.008474566042423248, -0.007310912013053894, -0.00614725798368454, -0.0049836039543151855, -0.0038199499249458313, -0.002656295895576477, -0.0014926418662071228, -0.00032898783683776855, 0.0008346661925315857, 0.00199832022190094, 0.003161974251270294, 0.0043256282806396484, 0.005489282310009003, 0.006652936339378357, 0.007816590368747711, 0.008980244398117065, 0.01014389842748642, 0.011307552456855774, 0.012471206486225128, 0.013634860515594482, 0.014798514544963837, 0.01596216857433319, 0.017125822603702545, 0.0182894766330719, 0.019453130662441254, 0.020616784691810608, 0.021780438721179962, 0.022944092750549316, 0.02410774677991867, 0.025271400809288025, 0.02643505483865738, 0.027598708868026733, 0.028762362897396088, 0.029926016926765442, 0.031089670956134796, 0.03225332498550415]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 7.0, 4.0, 11.0, 4.0, 9.0, 13.0, 16.0, 24.0, 40.0, 44.0, 60.0, 83.0, 110.0, 154.0, 212.0, 349.0, 555.0, 1054.0, 2834.0, 5660.0, 21859.0, 1716014.0, 2406170.0, 28828.0, 5905.0, 1959.0, 761.0, 424.0, 284.0, 203.0, 158.0, 116.0, 77.0, 59.0, 47.0, 40.0, 29.0, 20.0, 20.0, 13.0, 13.0, 7.0, 9.0, 11.0, 1.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.023162841796875, -0.02236485481262207, -0.02156686782836914, -0.02076888084411621, -0.01997089385986328, -0.01917290687561035, -0.018374919891357422, -0.017576932907104492, -0.016778945922851562, -0.015980958938598633, -0.015182971954345703, -0.014384984970092773, -0.013586997985839844, -0.012789011001586914, -0.011991024017333984, -0.011193037033081055, -0.010395050048828125, -0.009597063064575195, -0.008799076080322266, -0.008001089096069336, -0.007203102111816406, -0.0064051151275634766, -0.005607128143310547, -0.004809141159057617, -0.0040111541748046875, -0.003213167190551758, -0.002415180206298828, -0.0016171932220458984, -0.0008192062377929688, -2.1219253540039062e-05, 0.0007767677307128906, 0.0015747547149658203, 0.00237274169921875, 0.0031707286834716797, 0.003968715667724609, 0.004766702651977539, 0.005564689636230469, 0.0063626766204833984, 0.007160663604736328, 0.007958650588989258, 0.008756637573242188, 0.009554624557495117, 0.010352611541748047, 0.011150598526000977, 0.011948585510253906, 0.012746572494506836, 0.013544559478759766, 0.014342546463012695, 0.015140533447265625, 0.015938520431518555, 0.016736507415771484, 0.017534494400024414, 0.018332481384277344, 0.019130468368530273, 0.019928455352783203, 0.020726442337036133, 0.021524429321289062, 0.022322416305541992, 0.023120403289794922, 0.02391839027404785, 0.02471637725830078, 0.02551436424255371, 0.02631235122680664, 0.02711033821105957, 0.0279083251953125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 11.0, 39.0, 95.0, 195.0, 209.0, 226.0, 143.0, 51.0, 18.0, 8.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0177154541015625, -0.017119646072387695, -0.01652383804321289, -0.015928030014038086, -0.015332221984863281, -0.014736413955688477, -0.014140605926513672, -0.013544797897338867, -0.012948989868164062, -0.012353181838989258, -0.011757373809814453, -0.011161565780639648, -0.010565757751464844, -0.009969949722290039, -0.009374141693115234, -0.00877833366394043, -0.008182525634765625, -0.00758671760559082, -0.006990909576416016, -0.006395101547241211, -0.005799293518066406, -0.0052034854888916016, -0.004607677459716797, -0.004011869430541992, -0.0034160614013671875, -0.002820253372192383, -0.002224445343017578, -0.0016286373138427734, -0.0010328292846679688, -0.00043702125549316406, 0.00015878677368164062, 0.0007545948028564453, 0.00135040283203125, 0.0019462108612060547, 0.0025420188903808594, 0.003137826919555664, 0.0037336349487304688, 0.0043294429779052734, 0.004925251007080078, 0.005521059036254883, 0.0061168670654296875, 0.006712675094604492, 0.007308483123779297, 0.007904291152954102, 0.008500099182128906, 0.009095907211303711, 0.009691715240478516, 0.01028752326965332, 0.010883331298828125, 0.01147913932800293, 0.012074947357177734, 0.012670755386352539, 0.013266563415527344, 0.013862371444702148, 0.014458179473876953, 0.015053987503051758, 0.015649795532226562, 0.016245603561401367, 0.016841411590576172, 0.017437219619750977, 0.01803302764892578, 0.018628835678100586, 0.01922464370727539, 0.019820451736450195, 0.020416259765625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 11.0, 17.0, 15.0, 24.0, 40.0, 91.0, 129.0, 257.0, 463.0, 944.0, 2120.0, 5955.0, 26025.0, 327979.0, 3661258.0, 144366.0, 16572.0, 4587.0, 1749.0, 782.0, 391.0, 213.0, 96.0, 69.0, 41.0, 30.0, 15.0, 11.0, 13.0, 5.0, 2.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0186004638671875, -0.018043041229248047, -0.017485618591308594, -0.01692819595336914, -0.016370773315429688, -0.015813350677490234, -0.015255928039550781, -0.014698505401611328, -0.014141082763671875, -0.013583660125732422, -0.013026237487792969, -0.012468814849853516, -0.011911392211914062, -0.01135396957397461, -0.010796546936035156, -0.010239124298095703, -0.00968170166015625, -0.009124279022216797, -0.008566856384277344, -0.00800943374633789, -0.0074520111083984375, -0.006894588470458984, -0.006337165832519531, -0.005779743194580078, -0.005222320556640625, -0.004664897918701172, -0.004107475280761719, -0.0035500526428222656, -0.0029926300048828125, -0.0024352073669433594, -0.0018777847290039062, -0.0013203620910644531, -0.000762939453125, -0.00020551681518554688, 0.00035190582275390625, 0.0009093284606933594, 0.0014667510986328125, 0.0020241737365722656, 0.0025815963745117188, 0.003139019012451172, 0.003696441650390625, 0.004253864288330078, 0.004811286926269531, 0.005368709564208984, 0.0059261322021484375, 0.006483554840087891, 0.007040977478027344, 0.007598400115966797, 0.00815582275390625, 0.008713245391845703, 0.009270668029785156, 0.00982809066772461, 0.010385513305664062, 0.010942935943603516, 0.011500358581542969, 0.012057781219482422, 0.012615203857421875, 0.013172626495361328, 0.013730049133300781, 0.014287471771240234, 0.014844894409179688, 0.01540231704711914, 0.015959739685058594, 0.016517162322998047, 0.0170745849609375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 9.0, 3.0, 10.0, 11.0, 19.0, 46.0, 52.0, 108.0, 227.0, 526.0, 1147.0, 981.0, 372.0, 195.0, 131.0, 80.0, 45.0, 36.0, 25.0, 14.0, 10.0, 10.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0109405517578125, -0.01049947738647461, -0.010058403015136719, -0.009617328643798828, -0.009176254272460938, -0.008735179901123047, -0.008294105529785156, -0.007853031158447266, -0.007411956787109375, -0.006970882415771484, -0.006529808044433594, -0.006088733673095703, -0.0056476593017578125, -0.005206584930419922, -0.004765510559082031, -0.004324436187744141, -0.00388336181640625, -0.0034422874450683594, -0.0030012130737304688, -0.002560138702392578, -0.0021190643310546875, -0.0016779899597167969, -0.0012369155883789062, -0.0007958412170410156, -0.000354766845703125, 8.630752563476562e-05, 0.0005273818969726562, 0.0009684562683105469, 0.0014095306396484375, 0.0018506050109863281, 0.0022916793823242188, 0.0027327537536621094, 0.003173828125, 0.0036149024963378906, 0.004055976867675781, 0.004497051239013672, 0.0049381256103515625, 0.005379199981689453, 0.005820274353027344, 0.006261348724365234, 0.006702423095703125, 0.007143497467041016, 0.007584571838378906, 0.008025646209716797, 0.008466720581054688, 0.008907794952392578, 0.009348869323730469, 0.00978994369506836, 0.01023101806640625, 0.01067209243774414, 0.011113166809082031, 0.011554241180419922, 0.011995315551757812, 0.012436389923095703, 0.012877464294433594, 0.013318538665771484, 0.013759613037109375, 0.014200687408447266, 0.014641761779785156, 0.015082836151123047, 0.015523910522460938, 0.015964984893798828, 0.01640605926513672, 0.01684713363647461, 0.0172882080078125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 30.0, 635.0, 305.0, 25.0, 11.0, 1.0, 1.0, 1.0, 2.0, 3.0], "bins": [-0.5228489637374878, -0.5134583711624146, -0.5040677785873413, -0.4946771562099457, -0.48528656363487244, -0.4758959710597992, -0.46650537848472595, -0.4571147859096527, -0.4477241635322571, -0.43833357095718384, -0.4289429783821106, -0.41955235600471497, -0.4101617634296417, -0.4007711708545685, -0.39138057827949524, -0.381989985704422, -0.37259939312934875, -0.3632088005542755, -0.35381820797920227, -0.34442758560180664, -0.3350369930267334, -0.32564640045166016, -0.3162558078765869, -0.30686521530151367, -0.29747462272644043, -0.2880840301513672, -0.27869343757629395, -0.2693028151988983, -0.2599122226238251, -0.25052163004875183, -0.2411310374736786, -0.23174044489860535, -0.22234980762004852, -0.21295921504497528, -0.20356860756874084, -0.1941780149936676, -0.18478742241859436, -0.17539681494235992, -0.16600622236728668, -0.15661561489105225, -0.147225022315979, -0.13783442974090576, -0.12844382226467133, -0.11905322968959808, -0.10966262966394424, -0.1002720296382904, -0.09088143706321716, -0.08149083703756332, -0.07210023701190948, -0.06270963698625565, -0.053319040685892105, -0.043928444385528564, -0.034537844359874725, -0.025147244334220886, -0.015756648033857346, -0.006366051733493805, 0.003024548292160034, 0.012415146455168724, 0.021805744618177414, 0.031196342781186104, 0.040586940944194794, 0.04997754096984863, 0.05936813727021217, 0.06875873357057571, 0.07814933359622955]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 4.0, 2.0, 13.0, 5.0, 16.0, 27.0, 31.0, 47.0, 53.0, 57.0, 67.0, 96.0, 90.0, 95.0, 91.0, 66.0, 60.0, 49.0, 36.0, 33.0, 22.0, 12.0, 11.0, 6.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0744444727897644, -0.07252074033021927, -0.07059701532125473, -0.0686732828617096, -0.06674955785274506, -0.06482582539319992, -0.06290209293365479, -0.06097836419939995, -0.05905463546514511, -0.057130906730890274, -0.05520717799663544, -0.0532834455370903, -0.051359716802835464, -0.04943598806858063, -0.04751225560903549, -0.045588526874780655, -0.04366479814052582, -0.04174106940627098, -0.039817340672016144, -0.03789360821247101, -0.03596987947821617, -0.034046150743961334, -0.0321224182844162, -0.03019868955016136, -0.028274960815906525, -0.026351232081651688, -0.0244275014847517, -0.022503770887851715, -0.020580042153596878, -0.01865631341934204, -0.016732582822442055, -0.014808853156864643, -0.012885123491287231, -0.01096139382570982, -0.009037664160132408, -0.0071139344945549965, -0.005190204828977585, -0.003266475163400173, -0.0013427454978227615, 0.0005809841677546501, 0.0025047138333320618, 0.004428443498909473, 0.006352173164486885, 0.008275902830064297, 0.010199632495641708, 0.01212336216121912, 0.014047091826796532, 0.015970822423696518, 0.017894551157951355, 0.019818279892206192, 0.02174201048910618, 0.023665741086006165, 0.025589469820261, 0.02751319855451584, 0.029436929151415825, 0.03136065974831581, 0.03328438848257065, 0.035208117216825485, 0.03713184595108032, 0.03905557841062546, 0.040979307144880295, 0.04290303587913513, 0.04482676833868027, 0.046750497072935104, 0.04867422580718994]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 6.0, 8.0, 12.0, 29.0, 40.0, 52.0, 78.0, 112.0, 167.0, 260.0, 383.0, 598.0, 941.0, 2102.0, 17034.0, 758098.0, 257925.0, 6991.0, 1492.0, 732.0, 465.0, 322.0, 247.0, 154.0, 98.0, 72.0, 51.0, 35.0, 21.0, 14.0, 7.0, 4.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0458984375, -0.044580936431884766, -0.04326343536376953, -0.0419459342956543, -0.04062843322753906, -0.03931093215942383, -0.037993431091308594, -0.03667593002319336, -0.035358428955078125, -0.03404092788696289, -0.032723426818847656, -0.03140592575073242, -0.030088424682617188, -0.028770923614501953, -0.02745342254638672, -0.026135921478271484, -0.02481842041015625, -0.023500919342041016, -0.02218341827392578, -0.020865917205810547, -0.019548416137695312, -0.018230915069580078, -0.016913414001464844, -0.01559591293334961, -0.014278411865234375, -0.01296091079711914, -0.011643409729003906, -0.010325908660888672, -0.009008407592773438, -0.007690906524658203, -0.006373405456542969, -0.005055904388427734, -0.0037384033203125, -0.0024209022521972656, -0.0011034011840820312, 0.00021409988403320312, 0.0015316009521484375, 0.002849102020263672, 0.004166603088378906, 0.005484104156494141, 0.006801605224609375, 0.00811910629272461, 0.009436607360839844, 0.010754108428955078, 0.012071609497070312, 0.013389110565185547, 0.014706611633300781, 0.016024112701416016, 0.01734161376953125, 0.018659114837646484, 0.01997661590576172, 0.021294116973876953, 0.022611618041992188, 0.023929119110107422, 0.025246620178222656, 0.02656412124633789, 0.027881622314453125, 0.02919912338256836, 0.030516624450683594, 0.03183412551879883, 0.03315162658691406, 0.0344691276550293, 0.03578662872314453, 0.037104129791259766, 0.038421630859375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 13.0, 34.0, 122.0, 214.0, 230.0, 211.0, 117.0, 35.0, 12.0, 9.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0191192626953125, -0.018492460250854492, -0.017865657806396484, -0.017238855361938477, -0.01661205291748047, -0.01598525047302246, -0.015358448028564453, -0.014731645584106445, -0.014104843139648438, -0.01347804069519043, -0.012851238250732422, -0.012224435806274414, -0.011597633361816406, -0.010970830917358398, -0.01034402847290039, -0.009717226028442383, -0.009090423583984375, -0.008463621139526367, -0.00783681869506836, -0.0072100162506103516, -0.006583213806152344, -0.005956411361694336, -0.005329608917236328, -0.00470280647277832, -0.0040760040283203125, -0.0034492015838623047, -0.002822399139404297, -0.002195596694946289, -0.0015687942504882812, -0.0009419918060302734, -0.0003151893615722656, 0.0003116130828857422, 0.00093841552734375, 0.0015652179718017578, 0.0021920204162597656, 0.0028188228607177734, 0.0034456253051757812, 0.004072427749633789, 0.004699230194091797, 0.005326032638549805, 0.0059528350830078125, 0.00657963752746582, 0.007206439971923828, 0.007833242416381836, 0.008460044860839844, 0.009086847305297852, 0.00971364974975586, 0.010340452194213867, 0.010967254638671875, 0.011594057083129883, 0.01222085952758789, 0.012847661972045898, 0.013474464416503906, 0.014101266860961914, 0.014728069305419922, 0.01535487174987793, 0.015981674194335938, 0.016608476638793945, 0.017235279083251953, 0.01786208152770996, 0.01848888397216797, 0.019115686416625977, 0.019742488861083984, 0.020369291305541992, 0.02099609375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 9.0, 3.0, 15.0, 17.0, 22.0, 27.0, 34.0, 46.0, 49.0, 72.0, 85.0, 139.0, 187.0, 339.0, 603.0, 1094.0, 2457.0, 6196.0, 20237.0, 87947.0, 386308.0, 411359.0, 96816.0, 22482.0, 6657.0, 2521.0, 1141.0, 617.0, 339.0, 206.0, 125.0, 99.0, 86.0, 55.0, 31.0, 39.0, 21.0, 15.0, 15.0, 9.0, 8.0, 11.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.01233673095703125, -0.011925935745239258, -0.011515140533447266, -0.011104345321655273, -0.010693550109863281, -0.010282754898071289, -0.009871959686279297, -0.009461164474487305, -0.009050369262695312, -0.00863957405090332, -0.008228778839111328, -0.007817983627319336, -0.007407188415527344, -0.0069963932037353516, -0.006585597991943359, -0.006174802780151367, -0.005764007568359375, -0.005353212356567383, -0.004942417144775391, -0.0045316219329833984, -0.004120826721191406, -0.003710031509399414, -0.003299236297607422, -0.0028884410858154297, -0.0024776458740234375, -0.0020668506622314453, -0.0016560554504394531, -0.001245260238647461, -0.0008344650268554688, -0.00042366981506347656, -1.2874603271484375e-05, 0.0003979206085205078, 0.0008087158203125, 0.0012195110321044922, 0.0016303062438964844, 0.0020411014556884766, 0.0024518966674804688, 0.002862691879272461, 0.003273487091064453, 0.0036842823028564453, 0.0040950775146484375, 0.00450587272644043, 0.004916667938232422, 0.005327463150024414, 0.005738258361816406, 0.0061490535736083984, 0.006559848785400391, 0.006970643997192383, 0.007381439208984375, 0.007792234420776367, 0.00820302963256836, 0.008613824844360352, 0.009024620056152344, 0.009435415267944336, 0.009846210479736328, 0.01025700569152832, 0.010667800903320312, 0.011078596115112305, 0.011489391326904297, 0.011900186538696289, 0.012310981750488281, 0.012721776962280273, 0.013132572174072266, 0.013543367385864258, 0.01395416259765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 5.0, 7.0, 6.0, 11.0, 14.0, 10.0, 17.0, 15.0, 28.0, 27.0, 22.0, 26.0, 38.0, 27.0, 46.0, 44.0, 31.0, 50.0, 54.0, 40.0, 47.0, 44.0, 45.0, 48.0, 51.0, 46.0, 28.0, 32.0, 25.0, 27.0, 19.0, 11.0, 12.0, 13.0, 11.0, 5.0, 10.0, 4.0, 6.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.011688232421875, -0.0113145112991333, -0.010940790176391602, -0.010567069053649902, -0.010193347930908203, -0.009819626808166504, -0.009445905685424805, -0.009072184562683105, -0.008698463439941406, -0.008324742317199707, -0.007951021194458008, -0.007577300071716309, -0.007203578948974609, -0.00682985782623291, -0.006456136703491211, -0.006082415580749512, -0.0057086944580078125, -0.005334973335266113, -0.004961252212524414, -0.004587531089782715, -0.004213809967041016, -0.0038400888442993164, -0.003466367721557617, -0.003092646598815918, -0.0027189254760742188, -0.0023452043533325195, -0.0019714832305908203, -0.001597762107849121, -0.0012240409851074219, -0.0008503198623657227, -0.00047659873962402344, -0.00010287761688232422, 0.000270843505859375, 0.0006445646286010742, 0.0010182857513427734, 0.0013920068740844727, 0.0017657279968261719, 0.002139449119567871, 0.0025131702423095703, 0.0028868913650512695, 0.0032606124877929688, 0.003634333610534668, 0.004008054733276367, 0.004381775856018066, 0.004755496978759766, 0.005129218101501465, 0.005502939224243164, 0.005876660346984863, 0.0062503814697265625, 0.006624102592468262, 0.006997823715209961, 0.00737154483795166, 0.007745265960693359, 0.008118987083435059, 0.008492708206176758, 0.008866429328918457, 0.009240150451660156, 0.009613871574401855, 0.009987592697143555, 0.010361313819885254, 0.010735034942626953, 0.011108756065368652, 0.011482477188110352, 0.01185619831085205, 0.01222991943359375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 7.0, 3.0, 11.0, 4.0, 13.0, 18.0, 23.0, 29.0, 50.0, 100.0, 154.0, 269.0, 448.0, 787.0, 1550.0, 3178.0, 9135.0, 54608.0, 707963.0, 239944.0, 20129.0, 5285.0, 2213.0, 1125.0, 623.0, 332.0, 226.0, 108.0, 79.0, 41.0, 24.0, 21.0, 8.0, 9.0, 13.0, 5.0, 8.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00786590576171875, -0.0076258182525634766, -0.007385730743408203, -0.00714564323425293, -0.006905555725097656, -0.006665468215942383, -0.006425380706787109, -0.006185293197631836, -0.0059452056884765625, -0.005705118179321289, -0.005465030670166016, -0.005224943161010742, -0.004984855651855469, -0.004744768142700195, -0.004504680633544922, -0.0042645931243896484, -0.004024505615234375, -0.0037844181060791016, -0.003544330596923828, -0.0033042430877685547, -0.0030641555786132812, -0.002824068069458008, -0.0025839805603027344, -0.002343893051147461, -0.0021038055419921875, -0.001863718032836914, -0.0016236305236816406, -0.0013835430145263672, -0.0011434555053710938, -0.0009033679962158203, -0.0006632804870605469, -0.00042319297790527344, -0.00018310546875, 5.698204040527344e-05, 0.0002970695495605469, 0.0005371570587158203, 0.0007772445678710938, 0.0010173320770263672, 0.0012574195861816406, 0.001497507095336914, 0.0017375946044921875, 0.001977682113647461, 0.0022177696228027344, 0.002457857131958008, 0.0026979446411132812, 0.0029380321502685547, 0.003178119659423828, 0.0034182071685791016, 0.003658294677734375, 0.0038983821868896484, 0.004138469696044922, 0.004378557205200195, 0.004618644714355469, 0.004858732223510742, 0.005098819732666016, 0.005338907241821289, 0.0055789947509765625, 0.005819082260131836, 0.006059169769287109, 0.006299257278442383, 0.006539344787597656, 0.00677943229675293, 0.007019519805908203, 0.0072596073150634766, 0.00749969482421875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 8.0, 6.0, 12.0, 10.0, 17.0, 24.0, 26.0, 53.0, 36.0, 65.0, 55.0, 65.0, 69.0, 82.0, 83.0, 69.0, 67.0, 52.0, 43.0, 33.0, 26.0, 19.0, 13.0, 20.0, 9.0, 7.0, 7.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.730722427368164e-05, -7.440242916345596e-05, -7.149763405323029e-05, -6.859283894300461e-05, -6.568804383277893e-05, -6.278324872255325e-05, -5.9878453612327576e-05, -5.69736585021019e-05, -5.406886339187622e-05, -5.116406828165054e-05, -4.8259273171424866e-05, -4.535447806119919e-05, -4.244968295097351e-05, -3.954488784074783e-05, -3.6640092730522156e-05, -3.373529762029648e-05, -3.08305025100708e-05, -2.7925707399845123e-05, -2.5020912289619446e-05, -2.211611717939377e-05, -1.921132206916809e-05, -1.6306526958942413e-05, -1.3401731848716736e-05, -1.0496936738491058e-05, -7.592141628265381e-06, -4.687346518039703e-06, -1.7825514078140259e-06, 1.1222437024116516e-06, 4.027038812637329e-06, 6.931833922863007e-06, 9.836629033088684e-06, 1.2741424143314362e-05, 1.564621925354004e-05, 1.8551014363765717e-05, 2.1455809473991394e-05, 2.436060458421707e-05, 2.726539969444275e-05, 3.0170194804668427e-05, 3.3074989914894104e-05, 3.597978502511978e-05, 3.888458013534546e-05, 4.1789375245571136e-05, 4.4694170355796814e-05, 4.759896546602249e-05, 5.050376057624817e-05, 5.3408555686473846e-05, 5.6313350796699524e-05, 5.92181459069252e-05, 6.212294101715088e-05, 6.502773612737656e-05, 6.793253123760223e-05, 7.083732634782791e-05, 7.374212145805359e-05, 7.664691656827927e-05, 7.955171167850494e-05, 8.245650678873062e-05, 8.53613018989563e-05, 8.826609700918198e-05, 9.117089211940765e-05, 9.407568722963333e-05, 9.698048233985901e-05, 9.988527745008469e-05, 0.00010279007256031036, 0.00010569486767053604, 0.00010859966278076172]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 6.0, 3.0, 12.0, 9.0, 9.0, 14.0, 16.0, 41.0, 68.0, 124.0, 229.0, 461.0, 836.0, 1542.0, 3532.0, 13105.0, 266729.0, 728251.0, 24686.0, 4752.0, 1916.0, 1064.0, 503.0, 292.0, 161.0, 77.0, 50.0, 12.0, 12.0, 10.0, 8.0, 6.0, 6.0, 9.0, 3.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01268768310546875, -0.012326717376708984, -0.011965751647949219, -0.011604785919189453, -0.011243820190429688, -0.010882854461669922, -0.010521888732910156, -0.01016092300415039, -0.009799957275390625, -0.00943899154663086, -0.009078025817871094, -0.008717060089111328, -0.008356094360351562, -0.007995128631591797, -0.007634162902832031, -0.007273197174072266, -0.0069122314453125, -0.006551265716552734, -0.006190299987792969, -0.005829334259033203, -0.0054683685302734375, -0.005107402801513672, -0.004746437072753906, -0.004385471343994141, -0.004024505615234375, -0.0036635398864746094, -0.0033025741577148438, -0.002941608428955078, -0.0025806427001953125, -0.002219676971435547, -0.0018587112426757812, -0.0014977455139160156, -0.00113677978515625, -0.0007758140563964844, -0.00041484832763671875, -5.3882598876953125e-05, 0.0003070831298828125, 0.0006680488586425781, 0.0010290145874023438, 0.0013899803161621094, 0.001750946044921875, 0.0021119117736816406, 0.0024728775024414062, 0.002833843231201172, 0.0031948089599609375, 0.003555774688720703, 0.003916740417480469, 0.004277706146240234, 0.004638671875, 0.004999637603759766, 0.005360603332519531, 0.005721569061279297, 0.0060825347900390625, 0.006443500518798828, 0.006804466247558594, 0.007165431976318359, 0.007526397705078125, 0.00788736343383789, 0.008248329162597656, 0.008609294891357422, 0.008970260620117188, 0.009331226348876953, 0.009692192077636719, 0.010053157806396484, 0.01041412353515625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 8.0, 4.0, 9.0, 16.0, 10.0, 19.0, 26.0, 33.0, 45.0, 63.0, 76.0, 101.0, 115.0, 115.0, 79.0, 65.0, 42.0, 38.0, 41.0, 25.0, 21.0, 20.0, 10.0, 8.0, 7.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0045013427734375, -0.004375845193862915, -0.00425034761428833, -0.004124850034713745, -0.00399935245513916, -0.003873854875564575, -0.0037483572959899902, -0.0036228597164154053, -0.0034973621368408203, -0.0033718645572662354, -0.0032463669776916504, -0.0031208693981170654, -0.0029953718185424805, -0.0028698742389678955, -0.0027443766593933105, -0.0026188790798187256, -0.0024933815002441406, -0.0023678839206695557, -0.0022423863410949707, -0.0021168887615203857, -0.0019913911819458008, -0.0018658936023712158, -0.0017403960227966309, -0.001614898443222046, -0.001489400863647461, -0.001363903284072876, -0.001238405704498291, -0.001112908124923706, -0.000987410545349121, -0.0008619129657745361, -0.0007364153861999512, -0.0006109178066253662, -0.00048542022705078125, -0.0003599226474761963, -0.00023442506790161133, -0.00010892748832702637, 1.6570091247558594e-05, 0.00014206767082214355, 0.0002675652503967285, 0.0003930628299713135, 0.0005185604095458984, 0.0006440579891204834, 0.0007695555686950684, 0.0008950531482696533, 0.0010205507278442383, 0.0011460483074188232, 0.0012715458869934082, 0.0013970434665679932, 0.0015225410461425781, 0.001648038625717163, 0.001773536205291748, 0.001899033784866333, 0.002024531364440918, 0.002150028944015503, 0.002275526523590088, 0.002401024103164673, 0.002526521682739258, 0.0026520192623138428, 0.0027775168418884277, 0.0029030144214630127, 0.0030285120010375977, 0.0031540095806121826, 0.0032795071601867676, 0.0034050047397613525, 0.0035305023193359375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 25.0, 246.0, 547.0, 154.0, 26.0, 8.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03863357752561569, -0.03248655050992966, -0.02633952535688877, -0.020192500203847885, -0.01404547318816185, -0.007898446172475815, -0.0017514228820800781, 0.004395604133605957, 0.010542631149291992, 0.016689658164978027, 0.022836683318018913, 0.0289837084710598, 0.035130735486745834, 0.04127776250243187, 0.047424785792827606, 0.05357181280851364, 0.059718839824199677, 0.06586586683988571, 0.07201289385557175, 0.07815991342067719, 0.08430694043636322, 0.09045396745204926, 0.09660099446773529, 0.10274802148342133, 0.10889504849910736, 0.1150420755147934, 0.12118910253047943, 0.12733612954616547, 0.1334831565618515, 0.13963018357753754, 0.14577719569206238, 0.1519242227077484, 0.15807124972343445, 0.16421827673912048, 0.17036530375480652, 0.17651233077049255, 0.1826593577861786, 0.18880638480186462, 0.19495341181755066, 0.2011004388332367, 0.20724746584892273, 0.21339449286460876, 0.2195415198802948, 0.22568854689598083, 0.23183557391166687, 0.2379826009273529, 0.24412962794303894, 0.250276654958725, 0.2564236521720886, 0.26257067918777466, 0.2687177062034607, 0.27486473321914673, 0.28101176023483276, 0.2871587872505188, 0.29330581426620483, 0.29945284128189087, 0.3055998682975769, 0.31174689531326294, 0.317893922328949, 0.324040949344635, 0.33018797636032104, 0.3363350033760071, 0.3424820303916931, 0.34862905740737915, 0.3547760844230652]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 2.0, 13.0, 6.0, 7.0, 11.0, 16.0, 16.0, 8.0, 21.0, 16.0, 23.0, 29.0, 32.0, 31.0, 36.0, 31.0, 48.0, 53.0, 46.0, 39.0, 33.0, 45.0, 44.0, 29.0, 41.0, 39.0, 35.0, 20.0, 32.0, 17.0, 22.0, 23.0, 17.0, 24.0, 16.0, 17.0, 12.0, 15.0, 6.0, 10.0, 8.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.03021639585494995, -0.029295291751623154, -0.028374185785651207, -0.02745307981967926, -0.026531975716352463, -0.025610871613025665, -0.02468976564705372, -0.023768659681081772, -0.022847555577754974, -0.021926451474428177, -0.02100534550845623, -0.020084239542484283, -0.019163135439157486, -0.01824203133583069, -0.017320925369858742, -0.016399819403886795, -0.015478715300559998, -0.014557610265910625, -0.013636505231261253, -0.012715400196611881, -0.01179429516196251, -0.010873190127313137, -0.009952085092663765, -0.009030980058014393, -0.00810987502336502, -0.007188769988715649, -0.0062676649540662766, -0.0053465599194169044, -0.004425454884767532, -0.0035043498501181602, -0.002583244815468788, -0.001662139780819416, -0.0007410347461700439, 0.00018007028847932816, 0.0011011753231287003, 0.0020222803577780724, 0.0029433853924274445, 0.0038644904270768166, 0.004785595461726189, 0.005706700496375561, 0.006627805531024933, 0.007548910565674305, 0.008470015600323677, 0.00939112063497305, 0.010312225669622421, 0.011233330704271793, 0.012154435738921165, 0.013075540773570538, 0.01399664580821991, 0.014917750842869282, 0.015838855877518654, 0.0167599618434906, 0.017681065946817398, 0.018602170050144196, 0.019523276016116142, 0.02044438198208809, 0.021365486085414886, 0.022286590188741684, 0.02320769615471363, 0.024128802120685577, 0.025049906224012375, 0.025971010327339172, 0.02689211629331112, 0.027813222259283066, 0.028734326362609863]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 5.0, 5.0, 9.0, 14.0, 16.0, 20.0, 32.0, 39.0, 49.0, 99.0, 121.0, 194.0, 292.0, 498.0, 1248.0, 2722.0, 5922.0, 50506.0, 4004970.0, 112516.0, 9873.0, 2991.0, 895.0, 435.0, 203.0, 174.0, 95.0, 76.0, 54.0, 59.0, 39.0, 17.0, 16.0, 15.0, 8.0, 14.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.0269775390625, -0.026124000549316406, -0.025270462036132812, -0.02441692352294922, -0.023563385009765625, -0.02270984649658203, -0.021856307983398438, -0.021002769470214844, -0.02014923095703125, -0.019295692443847656, -0.018442153930664062, -0.01758861541748047, -0.016735076904296875, -0.01588153839111328, -0.015027999877929688, -0.014174461364746094, -0.0133209228515625, -0.012467384338378906, -0.011613845825195312, -0.010760307312011719, -0.009906768798828125, -0.009053230285644531, -0.008199691772460938, -0.007346153259277344, -0.00649261474609375, -0.005639076232910156, -0.0047855377197265625, -0.003931999206542969, -0.003078460693359375, -0.0022249221801757812, -0.0013713836669921875, -0.0005178451538085938, 0.000335693359375, 0.0011892318725585938, 0.0020427703857421875, 0.0028963088989257812, 0.003749847412109375, 0.004603385925292969, 0.0054569244384765625, 0.006310462951660156, 0.00716400146484375, 0.008017539978027344, 0.008871078491210938, 0.009724617004394531, 0.010578155517578125, 0.011431694030761719, 0.012285232543945312, 0.013138771057128906, 0.0139923095703125, 0.014845848083496094, 0.015699386596679688, 0.01655292510986328, 0.017406463623046875, 0.01826000213623047, 0.019113540649414062, 0.019967079162597656, 0.02082061767578125, 0.021674156188964844, 0.022527694702148438, 0.02338123321533203, 0.024234771728515625, 0.02508831024169922, 0.025941848754882812, 0.026795387268066406, 0.02764892578125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 38.0, 104.0, 209.0, 215.0, 224.0, 125.0, 52.0, 14.0, 10.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0180816650390625, -0.017450809478759766, -0.01681995391845703, -0.016189098358154297, -0.015558242797851562, -0.014927387237548828, -0.014296531677246094, -0.01366567611694336, -0.013034820556640625, -0.01240396499633789, -0.011773109436035156, -0.011142253875732422, -0.010511398315429688, -0.009880542755126953, -0.009249687194824219, -0.008618831634521484, -0.00798797607421875, -0.007357120513916016, -0.006726264953613281, -0.006095409393310547, -0.0054645538330078125, -0.004833698272705078, -0.004202842712402344, -0.0035719871520996094, -0.002941131591796875, -0.0023102760314941406, -0.0016794204711914062, -0.0010485649108886719, -0.0004177093505859375, 0.00021314620971679688, 0.0008440017700195312, 0.0014748573303222656, 0.002105712890625, 0.0027365684509277344, 0.0033674240112304688, 0.003998279571533203, 0.0046291351318359375, 0.005259990692138672, 0.005890846252441406, 0.006521701812744141, 0.007152557373046875, 0.007783412933349609, 0.008414268493652344, 0.009045124053955078, 0.009675979614257812, 0.010306835174560547, 0.010937690734863281, 0.011568546295166016, 0.01219940185546875, 0.012830257415771484, 0.013461112976074219, 0.014091968536376953, 0.014722824096679688, 0.015353679656982422, 0.015984535217285156, 0.01661539077758789, 0.017246246337890625, 0.01787710189819336, 0.018507957458496094, 0.019138813018798828, 0.019769668579101562, 0.020400524139404297, 0.02103137969970703, 0.021662235260009766, 0.0222930908203125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 7.0, 10.0, 21.0, 24.0, 39.0, 64.0, 107.0, 193.0, 356.0, 680.0, 1521.0, 3857.0, 14289.0, 102796.0, 3650442.0, 378954.0, 30339.0, 6568.0, 2172.0, 869.0, 463.0, 201.0, 124.0, 58.0, 41.0, 33.0, 16.0, 14.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0107574462890625, -0.010262012481689453, -0.009766578674316406, -0.00927114486694336, -0.008775711059570312, -0.008280277252197266, -0.007784843444824219, -0.007289409637451172, -0.006793975830078125, -0.006298542022705078, -0.005803108215332031, -0.005307674407958984, -0.0048122406005859375, -0.004316806793212891, -0.0038213729858398438, -0.003325939178466797, -0.00283050537109375, -0.002335071563720703, -0.0018396377563476562, -0.0013442039489746094, -0.0008487701416015625, -0.0003533363342285156, 0.00014209747314453125, 0.0006375312805175781, 0.001132965087890625, 0.0016283988952636719, 0.0021238327026367188, 0.0026192665100097656, 0.0031147003173828125, 0.0036101341247558594, 0.004105567932128906, 0.004601001739501953, 0.005096435546875, 0.005591869354248047, 0.006087303161621094, 0.006582736968994141, 0.0070781707763671875, 0.007573604583740234, 0.008069038391113281, 0.008564472198486328, 0.009059906005859375, 0.009555339813232422, 0.010050773620605469, 0.010546207427978516, 0.011041641235351562, 0.01153707504272461, 0.012032508850097656, 0.012527942657470703, 0.01302337646484375, 0.013518810272216797, 0.014014244079589844, 0.01450967788696289, 0.015005111694335938, 0.015500545501708984, 0.01599597930908203, 0.016491413116455078, 0.016986846923828125, 0.017482280731201172, 0.01797771453857422, 0.018473148345947266, 0.018968582153320312, 0.01946401596069336, 0.019959449768066406, 0.020454883575439453, 0.0209503173828125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 5.0, 4.0, 10.0, 17.0, 25.0, 32.0, 65.0, 79.0, 175.0, 453.0, 1215.0, 1052.0, 400.0, 184.0, 99.0, 77.0, 47.0, 39.0, 23.0, 18.0, 11.0, 7.0, 6.0, 8.0, 4.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01050567626953125, -0.010186433792114258, -0.009867191314697266, -0.009547948837280273, -0.009228706359863281, -0.008909463882446289, -0.008590221405029297, -0.008270978927612305, -0.007951736450195312, -0.00763249397277832, -0.007313251495361328, -0.006994009017944336, -0.006674766540527344, -0.0063555240631103516, -0.006036281585693359, -0.005717039108276367, -0.005397796630859375, -0.005078554153442383, -0.004759311676025391, -0.0044400691986083984, -0.004120826721191406, -0.003801584243774414, -0.003482341766357422, -0.0031630992889404297, -0.0028438568115234375, -0.0025246143341064453, -0.002205371856689453, -0.001886129379272461, -0.0015668869018554688, -0.0012476444244384766, -0.0009284019470214844, -0.0006091594696044922, -0.0002899169921875, 2.9325485229492188e-05, 0.0003485679626464844, 0.0006678104400634766, 0.0009870529174804688, 0.001306295394897461, 0.0016255378723144531, 0.0019447803497314453, 0.0022640228271484375, 0.0025832653045654297, 0.002902507781982422, 0.003221750259399414, 0.0035409927368164062, 0.0038602352142333984, 0.004179477691650391, 0.004498720169067383, 0.004817962646484375, 0.005137205123901367, 0.005456447601318359, 0.0057756900787353516, 0.006094932556152344, 0.006414175033569336, 0.006733417510986328, 0.00705265998840332, 0.0073719024658203125, 0.007691144943237305, 0.008010387420654297, 0.008329629898071289, 0.008648872375488281, 0.008968114852905273, 0.009287357330322266, 0.009606599807739258, 0.00992584228515625]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 34.0, 366.0, 505.0, 82.0, 11.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20076274871826172, -0.19598011672496796, -0.1911974847316742, -0.18641485273838043, -0.18163222074508667, -0.1768496036529541, -0.17206695675849915, -0.16728433966636658, -0.16250170767307281, -0.15771907567977905, -0.1529364436864853, -0.14815381169319153, -0.14337117969989777, -0.138588547706604, -0.13380593061447144, -0.12902329862117767, -0.12424065917730331, -0.11945802718400955, -0.11467539519071579, -0.10989277064800262, -0.10511013865470886, -0.1003275066614151, -0.09554487466812134, -0.09076224267482758, -0.08597961068153381, -0.08119697868824005, -0.07641434669494629, -0.07163171470165253, -0.06684909015893936, -0.0620664581656456, -0.05728382617235184, -0.05250119790434837, -0.04771857708692551, -0.042935945093631744, -0.03815331682562828, -0.03337068483233452, -0.028588054701685905, -0.023805424571037292, -0.01902279257774353, -0.014240164309740067, -0.009457532316446304, -0.004674901720136404, 0.00010772887617349625, 0.004890359938144684, 0.009672990068793297, 0.01445562019944191, 0.019238252192735672, 0.024020880460739136, 0.028803512454032898, 0.03358614444732666, 0.038368772715330124, 0.043151404708623886, 0.04793403297662735, 0.05271666496992111, 0.057499296963214874, 0.06228192523121834, 0.0670645534992218, 0.07184718549251556, 0.07662981748580933, 0.08141244947910309, 0.08619507402181625, 0.09097770601511002, 0.09576033800840378, 0.10054296255111694, 0.1053256019949913]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 8.0, 8.0, 10.0, 15.0, 18.0, 23.0, 34.0, 34.0, 47.0, 57.0, 64.0, 72.0, 67.0, 67.0, 60.0, 61.0, 78.0, 61.0, 39.0, 38.0, 34.0, 23.0, 17.0, 11.0, 20.0, 13.0, 10.0, 1.0, 6.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02980595827102661, -0.02871539816260338, -0.027624839916825294, -0.02653428167104721, -0.025443721562623978, -0.024353161454200745, -0.02326260320842266, -0.022172044962644577, -0.021081484854221344, -0.01999092474579811, -0.018900366500020027, -0.017809808254241943, -0.01671924814581871, -0.015628688037395477, -0.014538129791617393, -0.013447570614516735, -0.012357011437416077, -0.011266452260315418, -0.01017589308321476, -0.009085333906114101, -0.007994774729013443, -0.006904215551912785, -0.005813656374812126, -0.004723097197711468, -0.0036325380206108093, -0.002541978843510151, -0.0014514196664094925, -0.0003608604893088341, 0.0007296986877918243, 0.0018202578648924828, 0.002910817041993141, 0.0040013762190938, 0.005091935396194458, 0.006182494573295116, 0.007273053750395775, 0.008363612927496433, 0.009454172104597092, 0.01054473128169775, 0.011635290458798409, 0.012725849635899067, 0.013816408812999725, 0.014906967990100384, 0.015997527167201042, 0.017088085412979126, 0.01817864552140236, 0.019269205629825592, 0.020359763875603676, 0.02145032212138176, 0.022540882229804993, 0.023631442338228226, 0.02472200058400631, 0.025812558829784393, 0.026903118938207626, 0.02799367904663086, 0.029084237292408943, 0.030174795538187027, 0.03126535564661026, 0.03235591575503349, 0.033446475863456726, 0.03453703224658966, 0.035627592355012894, 0.03671815246343613, 0.03780870884656906, 0.038899268954992294, 0.03998982906341553]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 5.0, 15.0, 11.0, 15.0, 24.0, 37.0, 32.0, 65.0, 88.0, 93.0, 150.0, 183.0, 313.0, 461.0, 699.0, 1358.0, 3938.0, 33812.0, 783884.0, 208545.0, 9862.0, 2091.0, 967.0, 545.0, 396.0, 256.0, 200.0, 147.0, 97.0, 66.0, 48.0, 40.0, 28.0, 18.0, 11.0, 11.0, 6.0, 7.0, 4.0, 6.0, 5.0, 4.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0236358642578125, -0.022814035415649414, -0.021992206573486328, -0.021170377731323242, -0.020348548889160156, -0.01952672004699707, -0.018704891204833984, -0.0178830623626709, -0.017061233520507812, -0.016239404678344727, -0.01541757583618164, -0.014595746994018555, -0.013773918151855469, -0.012952089309692383, -0.012130260467529297, -0.011308431625366211, -0.010486602783203125, -0.009664773941040039, -0.008842945098876953, -0.008021116256713867, -0.007199287414550781, -0.006377458572387695, -0.005555629730224609, -0.0047338008880615234, -0.0039119720458984375, -0.0030901432037353516, -0.0022683143615722656, -0.0014464855194091797, -0.0006246566772460938, 0.0001971721649169922, 0.0010190010070800781, 0.001840829849243164, 0.00266265869140625, 0.003484487533569336, 0.004306316375732422, 0.005128145217895508, 0.005949974060058594, 0.00677180290222168, 0.007593631744384766, 0.008415460586547852, 0.009237289428710938, 0.010059118270874023, 0.01088094711303711, 0.011702775955200195, 0.012524604797363281, 0.013346433639526367, 0.014168262481689453, 0.014990091323852539, 0.015811920166015625, 0.01663374900817871, 0.017455577850341797, 0.018277406692504883, 0.01909923553466797, 0.019921064376831055, 0.02074289321899414, 0.021564722061157227, 0.022386550903320312, 0.0232083797454834, 0.024030208587646484, 0.02485203742980957, 0.025673866271972656, 0.026495695114135742, 0.027317523956298828, 0.028139352798461914, 0.028961181640625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 16.0, 54.0, 142.0, 193.0, 212.0, 205.0, 100.0, 50.0, 16.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.01806640625, -0.017472267150878906, -0.016878128051757812, -0.01628398895263672, -0.015689849853515625, -0.015095710754394531, -0.014501571655273438, -0.013907432556152344, -0.01331329345703125, -0.012719154357910156, -0.012125015258789062, -0.011530876159667969, -0.010936737060546875, -0.010342597961425781, -0.009748458862304688, -0.009154319763183594, -0.0085601806640625, -0.007966041564941406, -0.0073719024658203125, -0.006777763366699219, -0.006183624267578125, -0.005589485168457031, -0.0049953460693359375, -0.004401206970214844, -0.00380706787109375, -0.0032129287719726562, -0.0026187896728515625, -0.0020246505737304688, -0.001430511474609375, -0.0008363723754882812, -0.0002422332763671875, 0.00035190582275390625, 0.000946044921875, 0.0015401840209960938, 0.0021343231201171875, 0.0027284622192382812, 0.003322601318359375, 0.003916740417480469, 0.0045108795166015625, 0.005105018615722656, 0.00569915771484375, 0.006293296813964844, 0.0068874359130859375, 0.007481575012207031, 0.008075714111328125, 0.008669853210449219, 0.009263992309570312, 0.009858131408691406, 0.0104522705078125, 0.011046409606933594, 0.011640548706054688, 0.012234687805175781, 0.012828826904296875, 0.013422966003417969, 0.014017105102539062, 0.014611244201660156, 0.01520538330078125, 0.015799522399902344, 0.016393661499023438, 0.01698780059814453, 0.017581939697265625, 0.01817607879638672, 0.018770217895507812, 0.019364356994628906, 0.01995849609375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 5.0, 4.0, 6.0, 5.0, 8.0, 8.0, 12.0, 11.0, 25.0, 15.0, 16.0, 32.0, 35.0, 50.0, 54.0, 58.0, 87.0, 130.0, 185.0, 408.0, 807.0, 2094.0, 6472.0, 25940.0, 141010.0, 570664.0, 244361.0, 41529.0, 9328.0, 2790.0, 1060.0, 474.0, 235.0, 142.0, 92.0, 85.0, 57.0, 66.0, 36.0, 35.0, 30.0, 16.0, 27.0, 17.0, 8.0, 8.0, 6.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.012847900390625, -0.012466073036193848, -0.012084245681762695, -0.011702418327331543, -0.01132059097290039, -0.010938763618469238, -0.010556936264038086, -0.010175108909606934, -0.009793281555175781, -0.009411454200744629, -0.009029626846313477, -0.008647799491882324, -0.008265972137451172, -0.00788414478302002, -0.007502317428588867, -0.007120490074157715, -0.0067386627197265625, -0.00635683536529541, -0.005975008010864258, -0.0055931806564331055, -0.005211353302001953, -0.004829525947570801, -0.0044476985931396484, -0.004065871238708496, -0.0036840438842773438, -0.0033022165298461914, -0.002920389175415039, -0.0025385618209838867, -0.0021567344665527344, -0.001774907112121582, -0.0013930797576904297, -0.0010112524032592773, -0.000629425048828125, -0.00024759769439697266, 0.0001342296600341797, 0.000516057014465332, 0.0008978843688964844, 0.0012797117233276367, 0.001661539077758789, 0.0020433664321899414, 0.0024251937866210938, 0.002807021141052246, 0.0031888484954833984, 0.0035706758499145508, 0.003952503204345703, 0.0043343305587768555, 0.004716157913208008, 0.00509798526763916, 0.0054798126220703125, 0.005861639976501465, 0.006243467330932617, 0.0066252946853637695, 0.007007122039794922, 0.007388949394226074, 0.0077707767486572266, 0.008152604103088379, 0.008534431457519531, 0.008916258811950684, 0.009298086166381836, 0.009679913520812988, 0.01006174087524414, 0.010443568229675293, 0.010825395584106445, 0.011207222938537598, 0.01158905029296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 0.0, 4.0, 5.0, 5.0, 4.0, 6.0, 3.0, 8.0, 16.0, 12.0, 7.0, 18.0, 15.0, 30.0, 33.0, 26.0, 20.0, 20.0, 21.0, 34.0, 32.0, 37.0, 42.0, 42.0, 37.0, 47.0, 46.0, 37.0, 32.0, 31.0, 25.0, 32.0, 33.0, 22.0, 23.0, 19.0, 24.0, 20.0, 23.0, 18.0, 19.0, 11.0, 11.0, 9.0, 7.0, 7.0, 12.0, 4.0, 3.0, 4.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.00865936279296875, -0.008371472358703613, -0.008083581924438477, -0.00779569149017334, -0.007507801055908203, -0.007219910621643066, -0.00693202018737793, -0.006644129753112793, -0.006356239318847656, -0.0060683488845825195, -0.005780458450317383, -0.005492568016052246, -0.005204677581787109, -0.004916787147521973, -0.004628896713256836, -0.004341006278991699, -0.0040531158447265625, -0.0037652254104614258, -0.003477334976196289, -0.0031894445419311523, -0.0029015541076660156, -0.002613663673400879, -0.002325773239135742, -0.0020378828048706055, -0.0017499923706054688, -0.001462101936340332, -0.0011742115020751953, -0.0008863210678100586, -0.0005984306335449219, -0.00031054019927978516, -2.2649765014648438e-05, 0.0002652406692504883, 0.000553131103515625, 0.0008410215377807617, 0.0011289119720458984, 0.0014168024063110352, 0.0017046928405761719, 0.0019925832748413086, 0.0022804737091064453, 0.002568364143371582, 0.0028562545776367188, 0.0031441450119018555, 0.003432035446166992, 0.003719925880432129, 0.004007816314697266, 0.004295706748962402, 0.004583597183227539, 0.004871487617492676, 0.0051593780517578125, 0.005447268486022949, 0.005735158920288086, 0.006023049354553223, 0.006310939788818359, 0.006598830223083496, 0.006886720657348633, 0.0071746110916137695, 0.007462501525878906, 0.007750391960144043, 0.00803828239440918, 0.008326172828674316, 0.008614063262939453, 0.00890195369720459, 0.009189844131469727, 0.009477734565734863, 0.009765625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 4.0, 12.0, 15.0, 24.0, 32.0, 62.0, 106.0, 144.0, 245.0, 518.0, 927.0, 1750.0, 3645.0, 9582.0, 30904.0, 152925.0, 613424.0, 180911.0, 34867.0, 10373.0, 4043.0, 1928.0, 962.0, 464.0, 255.0, 166.0, 95.0, 55.0, 32.0, 29.0, 14.0, 13.0, 9.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0041046142578125, -0.0039656758308410645, -0.003826737403869629, -0.0036877989768981934, -0.003548860549926758, -0.0034099221229553223, -0.0032709836959838867, -0.003132045269012451, -0.0029931068420410156, -0.00285416841506958, -0.0027152299880981445, -0.002576291561126709, -0.0024373531341552734, -0.002298414707183838, -0.0021594762802124023, -0.002020537853240967, -0.0018815994262695312, -0.0017426609992980957, -0.0016037225723266602, -0.0014647841453552246, -0.001325845718383789, -0.0011869072914123535, -0.001047968864440918, -0.0009090304374694824, -0.0007700920104980469, -0.0006311535835266113, -0.0004922151565551758, -0.00035327672958374023, -0.0002143383026123047, -7.539987564086914e-05, 6.35385513305664e-05, 0.00020247697830200195, 0.0003414154052734375, 0.00048035383224487305, 0.0006192922592163086, 0.0007582306861877441, 0.0008971691131591797, 0.0010361075401306152, 0.0011750459671020508, 0.0013139843940734863, 0.0014529228210449219, 0.0015918612480163574, 0.001730799674987793, 0.0018697381019592285, 0.002008676528930664, 0.0021476149559020996, 0.002286553382873535, 0.0024254918098449707, 0.0025644302368164062, 0.002703368663787842, 0.0028423070907592773, 0.002981245517730713, 0.0031201839447021484, 0.003259122371673584, 0.0033980607986450195, 0.003536999225616455, 0.0036759376525878906, 0.003814876079559326, 0.003953814506530762, 0.004092752933502197, 0.004231691360473633, 0.004370629787445068, 0.004509568214416504, 0.0046485066413879395, 0.004787445068359375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 8.0, 9.0, 17.0, 22.0, 27.0, 63.0, 87.0, 129.0, 156.0, 149.0, 110.0, 67.0, 42.0, 33.0, 35.0, 21.0, 7.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022232532501220703, -0.00021508708596229553, -0.00020784884691238403, -0.00020061060786247253, -0.00019337236881256104, -0.00018613412976264954, -0.00017889589071273804, -0.00017165765166282654, -0.00016441941261291504, -0.00015718117356300354, -0.00014994293451309204, -0.00014270469546318054, -0.00013546645641326904, -0.00012822821736335754, -0.00012098997831344604, -0.00011375173926353455, -0.00010651350021362305, -9.927526116371155e-05, -9.203702211380005e-05, -8.479878306388855e-05, -7.756054401397705e-05, -7.032230496406555e-05, -6.308406591415405e-05, -5.5845826864242554e-05, -4.8607587814331055e-05, -4.1369348764419556e-05, -3.413110971450806e-05, -2.6892870664596558e-05, -1.965463161468506e-05, -1.241639256477356e-05, -5.1781535148620605e-06, 2.0600855350494385e-06, 9.298324584960938e-06, 1.6536563634872437e-05, 2.3774802684783936e-05, 3.1013041734695435e-05, 3.8251280784606934e-05, 4.548951983451843e-05, 5.272775888442993e-05, 5.996599793434143e-05, 6.720423698425293e-05, 7.444247603416443e-05, 8.168071508407593e-05, 8.891895413398743e-05, 9.615719318389893e-05, 0.00010339543223381042, 0.00011063367128372192, 0.00011787191033363342, 0.00012511014938354492, 0.00013234838843345642, 0.00013958662748336792, 0.00014682486653327942, 0.00015406310558319092, 0.00016130134463310242, 0.00016853958368301392, 0.00017577782273292542, 0.00018301606178283691, 0.0001902543008327484, 0.0001974925398826599, 0.0002047307789325714, 0.0002119690179824829, 0.0002192072570323944, 0.0002264454960823059, 0.0002336837351322174, 0.0002409219741821289]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 5.0, 2.0, 15.0, 13.0, 6.0, 11.0, 22.0, 21.0, 19.0, 43.0, 68.0, 118.0, 252.0, 565.0, 1274.0, 3142.0, 10643.0, 64941.0, 724934.0, 211641.0, 22096.0, 5265.0, 1882.0, 744.0, 335.0, 188.0, 95.0, 52.0, 37.0, 31.0, 20.0, 16.0, 10.0, 5.0, 6.0, 6.0, 9.0, 8.0, 0.0, 3.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.007289886474609375, -0.00706714391708374, -0.0068444013595581055, -0.006621658802032471, -0.006398916244506836, -0.006176173686981201, -0.005953431129455566, -0.005730688571929932, -0.005507946014404297, -0.005285203456878662, -0.005062460899353027, -0.004839718341827393, -0.004616975784301758, -0.004394233226776123, -0.004171490669250488, -0.0039487481117248535, -0.0037260055541992188, -0.003503262996673584, -0.0032805204391479492, -0.0030577778816223145, -0.0028350353240966797, -0.002612292766571045, -0.00238955020904541, -0.0021668076515197754, -0.0019440650939941406, -0.0017213225364685059, -0.001498579978942871, -0.0012758374214172363, -0.0010530948638916016, -0.0008303523063659668, -0.000607609748840332, -0.00038486719131469727, -0.0001621246337890625, 6.0617923736572266e-05, 0.00028336048126220703, 0.0005061030387878418, 0.0007288455963134766, 0.0009515881538391113, 0.001174330711364746, 0.0013970732688903809, 0.0016198158264160156, 0.0018425583839416504, 0.002065300941467285, 0.00228804349899292, 0.0025107860565185547, 0.0027335286140441895, 0.0029562711715698242, 0.003179013729095459, 0.0034017562866210938, 0.0036244988441467285, 0.0038472414016723633, 0.004069983959197998, 0.004292726516723633, 0.004515469074249268, 0.004738211631774902, 0.004960954189300537, 0.005183696746826172, 0.005406439304351807, 0.005629181861877441, 0.005851924419403076, 0.006074666976928711, 0.006297409534454346, 0.0065201520919799805, 0.006742894649505615, 0.00696563720703125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 3.0, 3.0, 5.0, 6.0, 6.0, 13.0, 13.0, 24.0, 20.0, 49.0, 89.0, 120.0, 128.0, 153.0, 97.0, 71.0, 53.0, 54.0, 16.0, 12.0, 11.0, 6.0, 6.0, 6.0, 4.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00611114501953125, -0.0059320926666259766, -0.005753040313720703, -0.00557398796081543, -0.005394935607910156, -0.005215883255004883, -0.005036830902099609, -0.004857778549194336, -0.0046787261962890625, -0.004499673843383789, -0.004320621490478516, -0.004141569137573242, -0.003962516784667969, -0.0037834644317626953, -0.003604412078857422, -0.0034253597259521484, -0.003246307373046875, -0.0030672550201416016, -0.002888202667236328, -0.0027091503143310547, -0.0025300979614257812, -0.002351045608520508, -0.0021719932556152344, -0.001992940902709961, -0.0018138885498046875, -0.001634836196899414, -0.0014557838439941406, -0.0012767314910888672, -0.0010976791381835938, -0.0009186267852783203, -0.0007395744323730469, -0.0005605220794677734, -0.0003814697265625, -0.00020241737365722656, -2.3365020751953125e-05, 0.0001556873321533203, 0.00033473968505859375, 0.0005137920379638672, 0.0006928443908691406, 0.0008718967437744141, 0.0010509490966796875, 0.001230001449584961, 0.0014090538024902344, 0.0015881061553955078, 0.0017671585083007812, 0.0019462108612060547, 0.002125263214111328, 0.0023043155670166016, 0.002483367919921875, 0.0026624202728271484, 0.002841472625732422, 0.0030205249786376953, 0.0031995773315429688, 0.003378629684448242, 0.0035576820373535156, 0.003736734390258789, 0.0039157867431640625, 0.004094839096069336, 0.004273891448974609, 0.004452943801879883, 0.004631996154785156, 0.00481104850769043, 0.004990100860595703, 0.0051691532135009766, 0.00534820556640625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 849.0, 164.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0588495172560215, -0.03818943351507187, -0.017529349774122238, 0.0031307339668273926, 0.023790817707777023, 0.04445090517401695, 0.06511098146438599, 0.08577106893062592, 0.10643115639686584, 0.12709124386310577, 0.1477513313293457, 0.16841140389442444, 0.18907149136066437, 0.2097315788269043, 0.23039165139198303, 0.25105172395706177, 0.2717118263244629, 0.2923718988895416, 0.31303200125694275, 0.3336920738220215, 0.3543521761894226, 0.37501224875450134, 0.3956723213195801, 0.4163324236869812, 0.43699249625205994, 0.45765256881713867, 0.4783126711845398, 0.49897274374961853, 0.5196328163146973, 0.5402929186820984, 0.5609530210494995, 0.5816130638122559, 0.6022731065750122, 0.6229332089424133, 0.6435932517051697, 0.6642533540725708, 0.6849134564399719, 0.705573558807373, 0.7262336015701294, 0.7468937039375305, 0.7675538063049316, 0.7882139086723328, 0.8088739514350891, 0.8295340538024902, 0.8501941561698914, 0.8708542585372925, 0.8915143013000488, 0.91217440366745, 0.9328344464302063, 0.9534945487976074, 0.9741545915603638, 0.9948146939277649, 1.015474796295166, 1.0361348390579224, 1.0567950010299683, 1.0774550437927246, 1.098115086555481, 1.1187751293182373, 1.1394352912902832, 1.1600953340530396, 1.180755376815796, 1.2014155387878418, 1.2220755815505981, 1.2427356243133545, 1.2633957862854004]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 1.0, 3.0, 8.0, 13.0, 21.0, 19.0, 36.0, 34.0, 42.0, 40.0, 63.0, 63.0, 67.0, 77.0, 60.0, 87.0, 66.0, 52.0, 49.0, 55.0, 42.0, 26.0, 24.0, 17.0, 12.0, 13.0, 4.0, 7.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.068867027759552, -0.06716986000537872, -0.06547269225120544, -0.06377552449703217, -0.06207835674285889, -0.06038118898868561, -0.05868402123451233, -0.05698685348033905, -0.05528968572616577, -0.05359251797199249, -0.051895350217819214, -0.050198182463645935, -0.048501014709472656, -0.04680384695529938, -0.0451066792011261, -0.04340951144695282, -0.04171234369277954, -0.04001517593860626, -0.03831800818443298, -0.036620840430259705, -0.034923672676086426, -0.03322650492191315, -0.03152933716773987, -0.02983216941356659, -0.02813500165939331, -0.026437833905220032, -0.024740666151046753, -0.023043498396873474, -0.021346330642700195, -0.019649162888526917, -0.017951995134353638, -0.01625482738018036, -0.01455765962600708, -0.012860491871833801, -0.011163324117660522, -0.009466156363487244, -0.007768988609313965, -0.006071820855140686, -0.004374653100967407, -0.0026774853467941284, -0.0009803175926208496, 0.0007168501615524292, 0.002414017915725708, 0.004111185669898987, 0.005808353424072266, 0.007505521178245544, 0.009202688932418823, 0.010899856686592102, 0.01259702444076538, 0.01429419219493866, 0.01599135994911194, 0.017688527703285217, 0.019385695457458496, 0.021082863211631775, 0.022780030965805054, 0.024477198719978333, 0.02617436647415161, 0.02787153422832489, 0.02956870198249817, 0.03126586973667145, 0.03296303749084473, 0.034660205245018005, 0.036357372999191284, 0.03805454075336456, 0.03975170850753784]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 8.0, 8.0, 12.0, 18.0, 22.0, 32.0, 48.0, 81.0, 113.0, 187.0, 294.0, 827.0, 2324.0, 7547.0, 450707.0, 3714472.0, 13616.0, 2527.0, 700.0, 253.0, 145.0, 104.0, 58.0, 47.0, 27.0, 24.0, 17.0, 13.0, 17.0, 5.0, 4.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0313720703125, -0.03036355972290039, -0.02935504913330078, -0.028346538543701172, -0.027338027954101562, -0.026329517364501953, -0.025321006774902344, -0.024312496185302734, -0.023303985595703125, -0.022295475006103516, -0.021286964416503906, -0.020278453826904297, -0.019269943237304688, -0.018261432647705078, -0.01725292205810547, -0.01624441146850586, -0.01523590087890625, -0.01422739028930664, -0.013218879699707031, -0.012210369110107422, -0.011201858520507812, -0.010193347930908203, -0.009184837341308594, -0.008176326751708984, -0.007167816162109375, -0.006159305572509766, -0.005150794982910156, -0.004142284393310547, -0.0031337738037109375, -0.002125263214111328, -0.0011167526245117188, -0.00010824203491210938, 0.0009002685546875, 0.0019087791442871094, 0.0029172897338867188, 0.003925800323486328, 0.0049343109130859375, 0.005942821502685547, 0.006951332092285156, 0.007959842681884766, 0.008968353271484375, 0.009976863861083984, 0.010985374450683594, 0.011993885040283203, 0.013002395629882812, 0.014010906219482422, 0.015019416809082031, 0.01602792739868164, 0.01703643798828125, 0.01804494857788086, 0.01905345916748047, 0.020061969757080078, 0.021070480346679688, 0.022078990936279297, 0.023087501525878906, 0.024096012115478516, 0.025104522705078125, 0.026113033294677734, 0.027121543884277344, 0.028130054473876953, 0.029138565063476562, 0.030147075653076172, 0.03115558624267578, 0.03216409683227539, 0.033172607421875]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 10.0, 51.0, 131.0, 219.0, 224.0, 202.0, 105.0, 38.0, 13.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0183563232421875, -0.017709732055664062, -0.017063140869140625, -0.016416549682617188, -0.01576995849609375, -0.015123367309570312, -0.014476776123046875, -0.013830184936523438, -0.01318359375, -0.012537002563476562, -0.011890411376953125, -0.011243820190429688, -0.01059722900390625, -0.009950637817382812, -0.009304046630859375, -0.008657455444335938, -0.0080108642578125, -0.0073642730712890625, -0.006717681884765625, -0.0060710906982421875, -0.00542449951171875, -0.0047779083251953125, -0.004131317138671875, -0.0034847259521484375, -0.002838134765625, -0.0021915435791015625, -0.001544952392578125, -0.0008983612060546875, -0.00025177001953125, 0.0003948211669921875, 0.001041412353515625, 0.0016880035400390625, 0.0023345947265625, 0.0029811859130859375, 0.003627777099609375, 0.0042743682861328125, 0.00492095947265625, 0.0055675506591796875, 0.006214141845703125, 0.0068607330322265625, 0.00750732421875, 0.008153915405273438, 0.008800506591796875, 0.009447097778320312, 0.01009368896484375, 0.010740280151367188, 0.011386871337890625, 0.012033462524414062, 0.0126800537109375, 0.013326644897460938, 0.013973236083984375, 0.014619827270507812, 0.01526641845703125, 0.015913009643554688, 0.016559600830078125, 0.017206192016601562, 0.017852783203125, 0.018499374389648438, 0.019145965576171875, 0.019792556762695312, 0.02043914794921875, 0.021085739135742188, 0.021732330322265625, 0.022378921508789062, 0.0230255126953125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 6.0, 9.0, 10.0, 10.0, 19.0, 32.0, 42.0, 87.0, 137.0, 234.0, 378.0, 803.0, 1704.0, 4691.0, 21278.0, 228531.0, 3821579.0, 95877.0, 13028.0, 3289.0, 1235.0, 565.0, 282.0, 175.0, 94.0, 66.0, 39.0, 31.0, 30.0, 6.0, 4.0, 6.0, 12.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013946533203125, -0.013486981391906738, -0.013027429580688477, -0.012567877769470215, -0.012108325958251953, -0.011648774147033691, -0.01118922233581543, -0.010729670524597168, -0.010270118713378906, -0.009810566902160645, -0.009351015090942383, -0.008891463279724121, -0.00843191146850586, -0.007972359657287598, -0.007512807846069336, -0.007053256034851074, -0.0065937042236328125, -0.006134152412414551, -0.005674600601196289, -0.005215048789978027, -0.004755496978759766, -0.004295945167541504, -0.003836393356323242, -0.0033768415451049805, -0.0029172897338867188, -0.002457737922668457, -0.0019981861114501953, -0.0015386343002319336, -0.0010790824890136719, -0.0006195306777954102, -0.00015997886657714844, 0.0002995729446411133, 0.000759124755859375, 0.0012186765670776367, 0.0016782283782958984, 0.00213778018951416, 0.002597332000732422, 0.0030568838119506836, 0.0035164356231689453, 0.003975987434387207, 0.004435539245605469, 0.0048950910568237305, 0.005354642868041992, 0.005814194679260254, 0.006273746490478516, 0.006733298301696777, 0.007192850112915039, 0.007652401924133301, 0.008111953735351562, 0.008571505546569824, 0.009031057357788086, 0.009490609169006348, 0.00995016098022461, 0.010409712791442871, 0.010869264602661133, 0.011328816413879395, 0.011788368225097656, 0.012247920036315918, 0.01270747184753418, 0.013167023658752441, 0.013626575469970703, 0.014086127281188965, 0.014545679092407227, 0.015005230903625488, 0.01546478271484375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 7.0, 10.0, 19.0, 22.0, 42.0, 80.0, 147.0, 826.0, 1896.0, 529.0, 208.0, 95.0, 54.0, 54.0, 27.0, 17.0, 11.0, 8.0, 7.0, 4.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01201629638671875, -0.011710822582244873, -0.011405348777770996, -0.01109987497329712, -0.010794401168823242, -0.010488927364349365, -0.010183453559875488, -0.009877979755401611, -0.009572505950927734, -0.009267032146453857, -0.00896155834197998, -0.008656084537506104, -0.008350610733032227, -0.00804513692855835, -0.007739663124084473, -0.007434189319610596, -0.007128715515136719, -0.006823241710662842, -0.006517767906188965, -0.006212294101715088, -0.005906820297241211, -0.005601346492767334, -0.005295872688293457, -0.00499039888381958, -0.004684925079345703, -0.004379451274871826, -0.004073977470397949, -0.0037685036659240723, -0.0034630298614501953, -0.0031575560569763184, -0.0028520822525024414, -0.0025466084480285645, -0.0022411346435546875, -0.0019356608390808105, -0.0016301870346069336, -0.0013247132301330566, -0.0010192394256591797, -0.0007137656211853027, -0.0004082918167114258, -0.00010281801223754883, 0.00020265579223632812, 0.0005081295967102051, 0.000813603401184082, 0.001119077205657959, 0.001424551010131836, 0.0017300248146057129, 0.00203549861907959, 0.002340972423553467, 0.0026464462280273438, 0.0029519200325012207, 0.0032573938369750977, 0.0035628676414489746, 0.0038683414459228516, 0.0041738152503967285, 0.0044792890548706055, 0.004784762859344482, 0.005090236663818359, 0.005395710468292236, 0.005701184272766113, 0.00600665807723999, 0.006312131881713867, 0.006617605686187744, 0.006923079490661621, 0.007228553295135498, 0.007534027099609375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 24.0, 344.0, 530.0, 89.0, 17.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2103511542081833, -0.20597201585769653, -0.20159286260604858, -0.19721372425556183, -0.19283458590507507, -0.18845544755458832, -0.18407630920410156, -0.1796971559524536, -0.17531801760196686, -0.1709388792514801, -0.16655972599983215, -0.1621805876493454, -0.15780144929885864, -0.1534223109483719, -0.14904317259788513, -0.14466401934623718, -0.14028488099575043, -0.13590574264526367, -0.13152658939361572, -0.12714745104312897, -0.12276831269264221, -0.11838917434215546, -0.1140100285410881, -0.10963088274002075, -0.105251744389534, -0.10087260603904724, -0.09649346023797989, -0.09211431443691254, -0.08773517608642578, -0.08335603773593903, -0.07897689193487167, -0.07459774613380432, -0.07021862268447876, -0.065839484333992, -0.06146033853292465, -0.0570811964571476, -0.052702054381370544, -0.04832291230559349, -0.04394377022981644, -0.03956462815403938, -0.03518548607826233, -0.030806344002485275, -0.02642720192670822, -0.022048059850931168, -0.017668917775154114, -0.01328977569937706, -0.008910633623600006, -0.004531491547822952, -0.00015234947204589844, 0.004226792603731155, 0.00860593467950821, 0.012985076755285263, 0.017364218831062317, 0.02174336090683937, 0.026122502982616425, 0.03050164505839348, 0.03488078713417053, 0.039259929209947586, 0.04363907128572464, 0.048018213361501694, 0.05239735543727875, 0.0567764975130558, 0.061155639588832855, 0.06553478538990021, 0.06991392374038696]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 9.0, 5.0, 9.0, 11.0, 13.0, 8.0, 18.0, 11.0, 28.0, 23.0, 28.0, 29.0, 18.0, 26.0, 32.0, 25.0, 34.0, 37.0, 31.0, 46.0, 34.0, 37.0, 43.0, 36.0, 33.0, 34.0, 34.0, 36.0, 33.0, 35.0, 34.0, 29.0, 20.0, 20.0, 22.0, 13.0, 16.0, 8.0, 14.0, 3.0, 8.0, 5.0, 3.0, 9.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.020189642906188965, -0.01961723156273365, -0.019044820219278336, -0.01847240887582302, -0.017899997532367706, -0.01732758618891239, -0.016755174845457077, -0.016182763502001762, -0.015610352158546448, -0.015037940815091133, -0.014465529471635818, -0.013893118128180504, -0.01332070678472519, -0.012748295441269875, -0.01217588409781456, -0.011603472754359245, -0.01103106141090393, -0.010458650067448616, -0.009886238723993301, -0.009313827380537987, -0.008741416037082672, -0.008169004693627357, -0.007596593350172043, -0.007024182006716728, -0.006451770663261414, -0.005879359319806099, -0.005306947976350784, -0.00473453663289547, -0.004162125289440155, -0.0035897139459848404, -0.0030173026025295258, -0.002444891259074211, -0.0018724799156188965, -0.0013000685721635818, -0.0007276572287082672, -0.00015524588525295258, 0.00041716545820236206, 0.0009895768016576767, 0.0015619881451129913, 0.002134399488568306, 0.0027068108320236206, 0.0032792221754789352, 0.00385163351893425, 0.0044240448623895645, 0.004996456205844879, 0.005568867549300194, 0.006141278892755508, 0.006713690236210823, 0.007286101579666138, 0.007858512923121452, 0.008430924266576767, 0.009003335610032082, 0.009575746953487396, 0.010148158296942711, 0.010720569640398026, 0.01129298098385334, 0.011865392327308655, 0.01243780367076397, 0.013010215014219284, 0.013582626357674599, 0.014155037701129913, 0.014727449044585228, 0.015299860388040543, 0.015872271731495857, 0.016444683074951172]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 5.0, 12.0, 8.0, 7.0, 13.0, 17.0, 26.0, 39.0, 42.0, 49.0, 102.0, 129.0, 191.0, 275.0, 334.0, 524.0, 768.0, 1402.0, 3965.0, 30919.0, 661196.0, 326751.0, 15573.0, 2771.0, 1077.0, 697.0, 466.0, 318.0, 222.0, 201.0, 119.0, 99.0, 66.0, 44.0, 27.0, 22.0, 24.0, 19.0, 9.0, 9.0, 6.0, 6.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0207366943359375, -0.020064830780029297, -0.019392967224121094, -0.01872110366821289, -0.018049240112304688, -0.017377376556396484, -0.01670551300048828, -0.016033649444580078, -0.015361785888671875, -0.014689922332763672, -0.014018058776855469, -0.013346195220947266, -0.012674331665039062, -0.01200246810913086, -0.011330604553222656, -0.010658740997314453, -0.00998687744140625, -0.009315013885498047, -0.008643150329589844, -0.00797128677368164, -0.0072994232177734375, -0.006627559661865234, -0.005955696105957031, -0.005283832550048828, -0.004611968994140625, -0.003940105438232422, -0.0032682418823242188, -0.0025963783264160156, -0.0019245147705078125, -0.0012526512145996094, -0.0005807876586914062, 9.107589721679688e-05, 0.000762939453125, 0.0014348030090332031, 0.0021066665649414062, 0.0027785301208496094, 0.0034503936767578125, 0.004122257232666016, 0.004794120788574219, 0.005465984344482422, 0.006137847900390625, 0.006809711456298828, 0.007481575012207031, 0.008153438568115234, 0.008825302124023438, 0.00949716567993164, 0.010169029235839844, 0.010840892791748047, 0.01151275634765625, 0.012184619903564453, 0.012856483459472656, 0.01352834701538086, 0.014200210571289062, 0.014872074127197266, 0.015543937683105469, 0.016215801239013672, 0.016887664794921875, 0.017559528350830078, 0.01823139190673828, 0.018903255462646484, 0.019575119018554688, 0.02024698257446289, 0.020918846130371094, 0.021590709686279297, 0.0222625732421875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 14.0, 50.0, 126.0, 210.0, 233.0, 200.0, 104.0, 39.0, 17.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.01898193359375, -0.018336772918701172, -0.017691612243652344, -0.017046451568603516, -0.016401290893554688, -0.01575613021850586, -0.015110969543457031, -0.014465808868408203, -0.013820648193359375, -0.013175487518310547, -0.012530326843261719, -0.01188516616821289, -0.011240005493164062, -0.010594844818115234, -0.009949684143066406, -0.009304523468017578, -0.00865936279296875, -0.008014202117919922, -0.007369041442871094, -0.006723880767822266, -0.0060787200927734375, -0.005433559417724609, -0.004788398742675781, -0.004143238067626953, -0.003498077392578125, -0.002852916717529297, -0.0022077560424804688, -0.0015625953674316406, -0.0009174346923828125, -0.0002722740173339844, 0.00037288665771484375, 0.0010180473327636719, 0.0016632080078125, 0.002308368682861328, 0.0029535293579101562, 0.0035986900329589844, 0.0042438507080078125, 0.004889011383056641, 0.005534172058105469, 0.006179332733154297, 0.006824493408203125, 0.007469654083251953, 0.008114814758300781, 0.00875997543334961, 0.009405136108398438, 0.010050296783447266, 0.010695457458496094, 0.011340618133544922, 0.01198577880859375, 0.012630939483642578, 0.013276100158691406, 0.013921260833740234, 0.014566421508789062, 0.01521158218383789, 0.01585674285888672, 0.016501903533935547, 0.017147064208984375, 0.017792224884033203, 0.01843738555908203, 0.01908254623413086, 0.019727706909179688, 0.020372867584228516, 0.021018028259277344, 0.021663188934326172, 0.022308349609375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 10.0, 7.0, 9.0, 11.0, 20.0, 23.0, 36.0, 32.0, 37.0, 41.0, 59.0, 82.0, 109.0, 170.0, 296.0, 653.0, 1836.0, 7421.0, 42044.0, 333350.0, 558462.0, 85584.0, 13173.0, 3052.0, 934.0, 356.0, 202.0, 118.0, 73.0, 45.0, 39.0, 48.0, 44.0, 22.0, 24.0, 16.0, 14.0, 13.0, 17.0, 10.0, 12.0, 9.0, 8.0, 8.0, 10.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012542724609375, -0.012140393257141113, -0.011738061904907227, -0.01133573055267334, -0.010933399200439453, -0.010531067848205566, -0.01012873649597168, -0.009726405143737793, -0.009324073791503906, -0.00892174243927002, -0.008519411087036133, -0.008117079734802246, -0.007714748382568359, -0.007312417030334473, -0.006910085678100586, -0.006507754325866699, -0.0061054229736328125, -0.005703091621398926, -0.005300760269165039, -0.004898428916931152, -0.004496097564697266, -0.004093766212463379, -0.003691434860229492, -0.0032891035079956055, -0.0028867721557617188, -0.002484440803527832, -0.0020821094512939453, -0.0016797780990600586, -0.0012774467468261719, -0.0008751153945922852, -0.00047278404235839844, -7.045269012451172e-05, 0.000331878662109375, 0.0007342100143432617, 0.0011365413665771484, 0.0015388727188110352, 0.0019412040710449219, 0.0023435354232788086, 0.0027458667755126953, 0.003148198127746582, 0.0035505294799804688, 0.0039528608322143555, 0.004355192184448242, 0.004757523536682129, 0.005159854888916016, 0.005562186241149902, 0.005964517593383789, 0.006366848945617676, 0.0067691802978515625, 0.007171511650085449, 0.007573843002319336, 0.007976174354553223, 0.00837850570678711, 0.008780837059020996, 0.009183168411254883, 0.00958549976348877, 0.009987831115722656, 0.010390162467956543, 0.01079249382019043, 0.011194825172424316, 0.011597156524658203, 0.01199948787689209, 0.012401819229125977, 0.012804150581359863, 0.01320648193359375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 2.0, 8.0, 8.0, 7.0, 7.0, 8.0, 3.0, 18.0, 22.0, 17.0, 24.0, 17.0, 36.0, 37.0, 40.0, 30.0, 41.0, 55.0, 46.0, 40.0, 45.0, 45.0, 53.0, 44.0, 38.0, 44.0, 40.0, 49.0, 27.0, 28.0, 31.0, 20.0, 9.0, 19.0, 6.0, 10.0, 6.0, 6.0, 6.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0129241943359375, -0.012560725212097168, -0.012197256088256836, -0.011833786964416504, -0.011470317840576172, -0.01110684871673584, -0.010743379592895508, -0.010379910469055176, -0.010016441345214844, -0.009652972221374512, -0.00928950309753418, -0.008926033973693848, -0.008562564849853516, -0.008199095726013184, -0.007835626602172852, -0.0074721574783325195, -0.0071086883544921875, -0.0067452192306518555, -0.0063817501068115234, -0.006018280982971191, -0.005654811859130859, -0.005291342735290527, -0.004927873611450195, -0.004564404487609863, -0.004200935363769531, -0.0038374662399291992, -0.003473997116088867, -0.003110527992248535, -0.002747058868408203, -0.002383589744567871, -0.002020120620727539, -0.001656651496887207, -0.001293182373046875, -0.000929713249206543, -0.0005662441253662109, -0.0002027750015258789, 0.00016069412231445312, 0.0005241632461547852, 0.0008876323699951172, 0.0012511014938354492, 0.0016145706176757812, 0.0019780397415161133, 0.0023415088653564453, 0.0027049779891967773, 0.0030684471130371094, 0.0034319162368774414, 0.0037953853607177734, 0.0041588544845581055, 0.0045223236083984375, 0.0048857927322387695, 0.0052492618560791016, 0.005612730979919434, 0.005976200103759766, 0.006339669227600098, 0.00670313835144043, 0.007066607475280762, 0.007430076599121094, 0.007793545722961426, 0.008157014846801758, 0.00852048397064209, 0.008883953094482422, 0.009247422218322754, 0.009610891342163086, 0.009974360466003418, 0.01033782958984375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 6.0, 5.0, 17.0, 5.0, 16.0, 25.0, 25.0, 51.0, 85.0, 121.0, 208.0, 361.0, 672.0, 1258.0, 2616.0, 5682.0, 13857.0, 37808.0, 134355.0, 491130.0, 260344.0, 63382.0, 20932.0, 8192.0, 3626.0, 1738.0, 893.0, 468.0, 278.0, 137.0, 107.0, 47.0, 29.0, 21.0, 24.0, 13.0, 11.0, 5.0, 7.0, 1.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0030117034912109375, -0.0029167532920837402, -0.002821803092956543, -0.0027268528938293457, -0.0026319026947021484, -0.002536952495574951, -0.002442002296447754, -0.0023470520973205566, -0.0022521018981933594, -0.002157151699066162, -0.002062201499938965, -0.0019672513008117676, -0.0018723011016845703, -0.001777350902557373, -0.0016824007034301758, -0.0015874505043029785, -0.0014925003051757812, -0.001397550106048584, -0.0013025999069213867, -0.0012076497077941895, -0.0011126995086669922, -0.001017749309539795, -0.0009227991104125977, -0.0008278489112854004, -0.0007328987121582031, -0.0006379485130310059, -0.0005429983139038086, -0.00044804811477661133, -0.00035309791564941406, -0.0002581477165222168, -0.00016319751739501953, -6.824731826782227e-05, 2.6702880859375e-05, 0.00012165307998657227, 0.00021660327911376953, 0.0003115534782409668, 0.00040650367736816406, 0.0005014538764953613, 0.0005964040756225586, 0.0006913542747497559, 0.0007863044738769531, 0.0008812546730041504, 0.0009762048721313477, 0.001071155071258545, 0.0011661052703857422, 0.0012610554695129395, 0.0013560056686401367, 0.001450955867767334, 0.0015459060668945312, 0.0016408562660217285, 0.0017358064651489258, 0.001830756664276123, 0.0019257068634033203, 0.0020206570625305176, 0.002115607261657715, 0.002210557460784912, 0.0023055076599121094, 0.0024004578590393066, 0.002495408058166504, 0.002590358257293701, 0.0026853084564208984, 0.0027802586555480957, 0.002875208854675293, 0.0029701590538024902, 0.0030651092529296875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 12.0, 15.0, 15.0, 31.0, 45.0, 51.0, 59.0, 88.0, 91.0, 118.0, 102.0, 91.0, 64.0, 75.0, 46.0, 45.0, 18.0, 12.0, 12.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015211105346679688, -0.00014808028936386108, -0.0001440495252609253, -0.0001400187611579895, -0.0001359879970550537, -0.00013195723295211792, -0.00012792646884918213, -0.00012389570474624634, -0.00011986494064331055, -0.00011583417654037476, -0.00011180341243743896, -0.00010777264833450317, -0.00010374188423156738, -9.971112012863159e-05, -9.56803560256958e-05, -9.164959192276001e-05, -8.761882781982422e-05, -8.358806371688843e-05, -7.955729961395264e-05, -7.552653551101685e-05, -7.149577140808105e-05, -6.746500730514526e-05, -6.343424320220947e-05, -5.940347909927368e-05, -5.537271499633789e-05, -5.13419508934021e-05, -4.731118679046631e-05, -4.328042268753052e-05, -3.9249658584594727e-05, -3.5218894481658936e-05, -3.1188130378723145e-05, -2.7157366275787354e-05, -2.3126602172851562e-05, -1.909583806991577e-05, -1.506507396697998e-05, -1.103430986404419e-05, -7.0035457611083984e-06, -2.9727816581726074e-06, 1.0579824447631836e-06, 5.088746547698975e-06, 9.119510650634766e-06, 1.3150274753570557e-05, 1.7181038856506348e-05, 2.121180295944214e-05, 2.524256706237793e-05, 2.927333116531372e-05, 3.330409526824951e-05, 3.73348593711853e-05, 4.1365623474121094e-05, 4.5396387577056885e-05, 4.9427151679992676e-05, 5.345791578292847e-05, 5.748867988586426e-05, 6.151944398880005e-05, 6.555020809173584e-05, 6.958097219467163e-05, 7.361173629760742e-05, 7.764250040054321e-05, 8.1673264503479e-05, 8.57040286064148e-05, 8.973479270935059e-05, 9.376555681228638e-05, 9.779632091522217e-05, 0.00010182708501815796, 0.00010585784912109375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 6.0, 2.0, 14.0, 13.0, 14.0, 28.0, 66.0, 154.0, 386.0, 1142.0, 4479.0, 28371.0, 530886.0, 451226.0, 25810.0, 4219.0, 1042.0, 391.0, 161.0, 66.0, 26.0, 17.0, 14.0, 8.0, 8.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00800323486328125, -0.007760524749755859, -0.007517814636230469, -0.007275104522705078, -0.0070323944091796875, -0.006789684295654297, -0.006546974182128906, -0.006304264068603516, -0.006061553955078125, -0.005818843841552734, -0.005576133728027344, -0.005333423614501953, -0.0050907135009765625, -0.004848003387451172, -0.004605293273925781, -0.004362583160400391, -0.004119873046875, -0.0038771629333496094, -0.0036344528198242188, -0.003391742706298828, -0.0031490325927734375, -0.002906322479248047, -0.0026636123657226562, -0.0024209022521972656, -0.002178192138671875, -0.0019354820251464844, -0.0016927719116210938, -0.0014500617980957031, -0.0012073516845703125, -0.0009646415710449219, -0.0007219314575195312, -0.0004792213439941406, -0.00023651123046875, 6.198883056640625e-06, 0.00024890899658203125, 0.0004916191101074219, 0.0007343292236328125, 0.0009770393371582031, 0.0012197494506835938, 0.0014624595642089844, 0.001705169677734375, 0.0019478797912597656, 0.0021905899047851562, 0.002433300018310547, 0.0026760101318359375, 0.002918720245361328, 0.0031614303588867188, 0.0034041404724121094, 0.0036468505859375, 0.0038895606994628906, 0.004132270812988281, 0.004374980926513672, 0.0046176910400390625, 0.004860401153564453, 0.005103111267089844, 0.005345821380615234, 0.005588531494140625, 0.005831241607666016, 0.006073951721191406, 0.006316661834716797, 0.0065593719482421875, 0.006802082061767578, 0.007044792175292969, 0.007287502288818359, 0.00753021240234375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 7.0, 0.0, 7.0, 2.0, 3.0, 5.0, 12.0, 12.0, 15.0, 27.0, 37.0, 29.0, 83.0, 85.0, 146.0, 129.0, 145.0, 82.0, 58.0, 31.0, 18.0, 15.0, 12.0, 17.0, 11.0, 4.0, 3.0, 6.0, 4.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005512237548828125, -0.005355894565582275, -0.005199551582336426, -0.005043208599090576, -0.0048868656158447266, -0.004730522632598877, -0.004574179649353027, -0.004417836666107178, -0.004261493682861328, -0.0041051506996154785, -0.003948807716369629, -0.0037924647331237793, -0.0036361217498779297, -0.00347977876663208, -0.0033234357833862305, -0.003167092800140381, -0.0030107498168945312, -0.0028544068336486816, -0.002698063850402832, -0.0025417208671569824, -0.002385377883911133, -0.002229034900665283, -0.0020726919174194336, -0.001916348934173584, -0.0017600059509277344, -0.0016036629676818848, -0.0014473199844360352, -0.0012909770011901855, -0.001134634017944336, -0.0009782910346984863, -0.0008219480514526367, -0.0006656050682067871, -0.0005092620849609375, -0.0003529191017150879, -0.00019657611846923828, -4.023313522338867e-05, 0.00011610984802246094, 0.00027245283126831055, 0.00042879581451416016, 0.0005851387977600098, 0.0007414817810058594, 0.000897824764251709, 0.0010541677474975586, 0.0012105107307434082, 0.0013668537139892578, 0.0015231966972351074, 0.001679539680480957, 0.0018358826637268066, 0.0019922256469726562, 0.002148568630218506, 0.0023049116134643555, 0.002461254596710205, 0.0026175975799560547, 0.0027739405632019043, 0.002930283546447754, 0.0030866265296936035, 0.003242969512939453, 0.0033993124961853027, 0.0035556554794311523, 0.003711998462677002, 0.0038683414459228516, 0.004024684429168701, 0.004181027412414551, 0.0043373703956604, 0.00449371337890625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 16.0, 975.0, 27.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07159274816513062, -0.05123282968997955, -0.03087291121482849, -0.01051299273967743, 0.009846925735473633, 0.030206844210624695, 0.05056676268577576, 0.07092668116092682, 0.09128659963607788, 0.11164651811122894, 0.13200643658638, 0.15236635506153107, 0.17272627353668213, 0.1930861920118332, 0.21344611048698425, 0.23380602896213531, 0.2541659474372864, 0.27452588081359863, 0.2948857843875885, 0.31524568796157837, 0.3356056213378906, 0.3559655547142029, 0.37632545828819275, 0.3966853618621826, 0.4170452952384949, 0.43740522861480713, 0.457765132188797, 0.47812503576278687, 0.4984849691390991, 0.5188449025154114, 0.5392048358917236, 0.5595647096633911, 0.5799245834350586, 0.6002845168113708, 0.6206444501876831, 0.6410043239593506, 0.6613642573356628, 0.6817241907119751, 0.7020840644836426, 0.7224439978599548, 0.7428039312362671, 0.7631638646125793, 0.7835237979888916, 0.8038836717605591, 0.8242436051368713, 0.8446035385131836, 0.8649634122848511, 0.8853233456611633, 0.9056832790374756, 0.9260432124137878, 0.9464031457901001, 0.9667630195617676, 0.9871229529380798, 1.007482886314392, 1.0278427600860596, 1.0482027530670166, 1.068562626838684, 1.0889225006103516, 1.1092824935913086, 1.129642367362976, 1.1500022411346436, 1.1703622341156006, 1.190722107887268, 1.211082100868225, 1.2314419746398926]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 7.0, 14.0, 12.0, 22.0, 15.0, 27.0, 39.0, 36.0, 50.0, 58.0, 56.0, 57.0, 49.0, 64.0, 72.0, 59.0, 65.0, 50.0, 45.0, 46.0, 33.0, 32.0, 28.0, 13.0, 18.0, 10.0, 13.0, 9.0, 2.0, 4.0, 0.0, 4.0, 3.0], "bins": [-0.07052725553512573, -0.0689583271741867, -0.06738939881324768, -0.06582047045230865, -0.06425154209136963, -0.06268260627985, -0.06111367791891098, -0.059544749557971954, -0.05797582119703293, -0.0564068928360939, -0.05483796447515488, -0.05326903238892555, -0.051700104027986526, -0.0501311756670475, -0.048562243580818176, -0.04699331521987915, -0.045424386858940125, -0.0438554584980011, -0.04228653013706207, -0.04071759805083275, -0.03914866968989372, -0.0375797413289547, -0.03601080924272537, -0.034441880881786346, -0.03287295252084732, -0.031304024159908295, -0.02973509393632412, -0.028166163712739944, -0.02659723535180092, -0.025028306990861893, -0.023459376767277718, -0.021890446543693542, -0.020321518182754517, -0.01875258982181549, -0.017183659598231316, -0.015614730305969715, -0.014045801013708115, -0.012476871721446514, -0.010907942429184914, -0.009339013136923313, -0.007770083844661713, -0.006201154552400112, -0.004632225260138512, -0.003063295967876911, -0.0014943666756153107, 7.456261664628983e-05, 0.0016434919089078903, 0.003212421201169491, 0.004781350493431091, 0.006350279785692692, 0.007919209077954292, 0.009488138370215893, 0.011057067662477493, 0.012625996954739094, 0.014194926247000694, 0.01576385647058487, 0.017332784831523895, 0.01890171319246292, 0.020470643416047096, 0.02203957363963127, 0.023608502000570297, 0.025177430361509323, 0.026746360585093498, 0.028315290808677673, 0.0298842191696167]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 4.0, 14.0, 6.0, 9.0, 12.0, 15.0, 32.0, 51.0, 77.0, 150.0, 255.0, 723.0, 2450.0, 10498.0, 4043204.0, 129779.0, 5194.0, 1108.0, 299.0, 153.0, 70.0, 44.0, 38.0, 25.0, 16.0, 14.0, 11.0, 3.0, 3.0, 6.0, 5.0, 4.0, 5.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0302276611328125, -0.02905583381652832, -0.02788400650024414, -0.02671217918395996, -0.02554035186767578, -0.0243685245513916, -0.023196697235107422, -0.022024869918823242, -0.020853042602539062, -0.019681215286254883, -0.018509387969970703, -0.017337560653686523, -0.016165733337402344, -0.014993906021118164, -0.013822078704833984, -0.012650251388549805, -0.011478424072265625, -0.010306596755981445, -0.009134769439697266, -0.007962942123413086, -0.006791114807128906, -0.0056192874908447266, -0.004447460174560547, -0.003275632858276367, -0.0021038055419921875, -0.0009319782257080078, 0.00023984909057617188, 0.0014116764068603516, 0.0025835037231445312, 0.003755331039428711, 0.004927158355712891, 0.00609898567199707, 0.00727081298828125, 0.00844264030456543, 0.00961446762084961, 0.010786294937133789, 0.011958122253417969, 0.013129949569702148, 0.014301776885986328, 0.015473604202270508, 0.016645431518554688, 0.017817258834838867, 0.018989086151123047, 0.020160913467407227, 0.021332740783691406, 0.022504568099975586, 0.023676395416259766, 0.024848222732543945, 0.026020050048828125, 0.027191877365112305, 0.028363704681396484, 0.029535531997680664, 0.030707359313964844, 0.03187918663024902, 0.0330510139465332, 0.03422284126281738, 0.03539466857910156, 0.03656649589538574, 0.03773832321166992, 0.0389101505279541, 0.04008197784423828, 0.04125380516052246, 0.04242563247680664, 0.04359745979309082, 0.044769287109375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 18.0, 58.0, 140.0, 216.0, 226.0, 183.0, 101.0, 32.0, 17.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.018218994140625, -0.01759791374206543, -0.01697683334350586, -0.01635575294494629, -0.01573467254638672, -0.015113592147827148, -0.014492511749267578, -0.013871431350708008, -0.013250350952148438, -0.012629270553588867, -0.012008190155029297, -0.011387109756469727, -0.010766029357910156, -0.010144948959350586, -0.009523868560791016, -0.008902788162231445, -0.008281707763671875, -0.007660627365112305, -0.007039546966552734, -0.006418466567993164, -0.005797386169433594, -0.0051763057708740234, -0.004555225372314453, -0.003934144973754883, -0.0033130645751953125, -0.002691984176635742, -0.002070903778076172, -0.0014498233795166016, -0.0008287429809570312, -0.00020766258239746094, 0.0004134178161621094, 0.0010344982147216797, 0.00165557861328125, 0.0022766590118408203, 0.0028977394104003906, 0.003518819808959961, 0.004139900207519531, 0.0047609806060791016, 0.005382061004638672, 0.006003141403198242, 0.0066242218017578125, 0.007245302200317383, 0.007866382598876953, 0.008487462997436523, 0.009108543395996094, 0.009729623794555664, 0.010350704193115234, 0.010971784591674805, 0.011592864990234375, 0.012213945388793945, 0.012835025787353516, 0.013456106185913086, 0.014077186584472656, 0.014698266983032227, 0.015319347381591797, 0.015940427780151367, 0.016561508178710938, 0.017182588577270508, 0.017803668975830078, 0.01842474937438965, 0.01904582977294922, 0.01966691017150879, 0.02028799057006836, 0.02090907096862793, 0.0215301513671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 4.0, 9.0, 9.0, 10.0, 9.0, 20.0, 29.0, 44.0, 60.0, 64.0, 72.0, 97.0, 146.0, 193.0, 268.0, 450.0, 754.0, 1466.0, 3598.0, 11160.0, 48682.0, 619342.0, 3388379.0, 91343.0, 18058.0, 5362.0, 2078.0, 908.0, 523.0, 319.0, 224.0, 167.0, 108.0, 79.0, 60.0, 51.0, 30.0, 25.0, 14.0, 19.0, 16.0, 13.0, 9.0, 4.0, 4.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.01117706298828125, -0.010849952697753906, -0.010522842407226562, -0.010195732116699219, -0.009868621826171875, -0.009541511535644531, -0.009214401245117188, -0.008887290954589844, -0.0085601806640625, -0.008233070373535156, -0.007905960083007812, -0.007578849792480469, -0.007251739501953125, -0.006924629211425781, -0.0065975189208984375, -0.006270408630371094, -0.00594329833984375, -0.005616188049316406, -0.0052890777587890625, -0.004961967468261719, -0.004634857177734375, -0.004307746887207031, -0.0039806365966796875, -0.0036535263061523438, -0.003326416015625, -0.0029993057250976562, -0.0026721954345703125, -0.0023450851440429688, -0.002017974853515625, -0.0016908645629882812, -0.0013637542724609375, -0.0010366439819335938, -0.00070953369140625, -0.00038242340087890625, -5.53131103515625e-05, 0.00027179718017578125, 0.000598907470703125, 0.0009260177612304688, 0.0012531280517578125, 0.0015802383422851562, 0.0019073486328125, 0.0022344589233398438, 0.0025615692138671875, 0.0028886795043945312, 0.003215789794921875, 0.0035429000854492188, 0.0038700103759765625, 0.004197120666503906, 0.00452423095703125, 0.004851341247558594, 0.0051784515380859375, 0.005505561828613281, 0.005832672119140625, 0.006159782409667969, 0.0064868927001953125, 0.006814002990722656, 0.00714111328125, 0.007468223571777344, 0.0077953338623046875, 0.008122444152832031, 0.008449554443359375, 0.008776664733886719, 0.009103775024414062, 0.009430885314941406, 0.00975799560546875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 12.0, 32.0, 48.0, 97.0, 300.0, 1977.0, 1125.0, 243.0, 99.0, 51.0, 30.0, 20.0, 10.0, 5.0, 7.0, 10.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0127410888671875, -0.012395262718200684, -0.012049436569213867, -0.01170361042022705, -0.011357784271240234, -0.011011958122253418, -0.010666131973266602, -0.010320305824279785, -0.009974479675292969, -0.009628653526306152, -0.009282827377319336, -0.00893700122833252, -0.008591175079345703, -0.008245348930358887, -0.00789952278137207, -0.007553696632385254, -0.0072078704833984375, -0.006862044334411621, -0.006516218185424805, -0.006170392036437988, -0.005824565887451172, -0.0054787397384643555, -0.005132913589477539, -0.004787087440490723, -0.004441261291503906, -0.00409543514251709, -0.0037496089935302734, -0.003403782844543457, -0.0030579566955566406, -0.0027121305465698242, -0.002366304397583008, -0.0020204782485961914, -0.001674652099609375, -0.0013288259506225586, -0.0009829998016357422, -0.0006371736526489258, -0.0002913475036621094, 5.447864532470703e-05, 0.00040030479431152344, 0.0007461309432983398, 0.0010919570922851562, 0.0014377832412719727, 0.001783609390258789, 0.0021294355392456055, 0.002475261688232422, 0.0028210878372192383, 0.0031669139862060547, 0.003512740135192871, 0.0038585662841796875, 0.004204392433166504, 0.00455021858215332, 0.004896044731140137, 0.005241870880126953, 0.0055876970291137695, 0.005933523178100586, 0.006279349327087402, 0.006625175476074219, 0.006971001625061035, 0.0073168277740478516, 0.007662653923034668, 0.008008480072021484, 0.0083543062210083, 0.008700132369995117, 0.009045958518981934, 0.00939178466796875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 11.0, 41.0, 112.0, 281.0, 296.0, 156.0, 66.0, 22.0, 11.0, 7.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08237071335315704, -0.08074934780597687, -0.07912798225879669, -0.07750660926103592, -0.07588524371385574, -0.07426387816667557, -0.07264251261949539, -0.07102114707231522, -0.06939977407455444, -0.06777840852737427, -0.06615704298019409, -0.06453566998243332, -0.06291430443525314, -0.06129293888807297, -0.05967157334089279, -0.05805020406842232, -0.05642884224653244, -0.054807476699352264, -0.05318610742688179, -0.051564741879701614, -0.04994337260723114, -0.048322007060050964, -0.04670064151287079, -0.045079272240400314, -0.04345790296792984, -0.041836537420749664, -0.04021516814827919, -0.038593802601099014, -0.03697243332862854, -0.035351067781448364, -0.03372970223426819, -0.032108332961797714, -0.03048696555197239, -0.028865598142147064, -0.02724423073232174, -0.025622863322496414, -0.02400149777531624, -0.022380130365490913, -0.02075876295566559, -0.019137397408485413, -0.01751602813601494, -0.015894660726189613, -0.014273294247686863, -0.012651926837861538, -0.011030560359358788, -0.009409192949533463, -0.0077878255397081375, -0.006166459061205387, -0.004545092582702637, -0.002923725638538599, -0.0013023584615439177, 0.0003190087154507637, 0.0019403756596148014, 0.003561742603778839, 0.005183110013604164, 0.0068044764921069145, 0.00842584390193224, 0.010047211311757565, 0.011668577790260315, 0.01328994520008564, 0.014911312609910965, 0.01653267815709114, 0.018154047429561615, 0.01977541297674179, 0.021396780386567116]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 4.0, 8.0, 6.0, 6.0, 9.0, 13.0, 17.0, 15.0, 20.0, 21.0, 27.0, 23.0, 24.0, 21.0, 34.0, 30.0, 40.0, 35.0, 34.0, 42.0, 36.0, 35.0, 40.0, 30.0, 44.0, 32.0, 34.0, 35.0, 37.0, 21.0, 21.0, 20.0, 32.0, 21.0, 24.0, 14.0, 16.0, 16.0, 10.0, 9.0, 6.0, 9.0, 8.0, 8.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0], "bins": [-0.013236522674560547, -0.01282115001231432, -0.012405777350068092, -0.011990404687821865, -0.011575032025575638, -0.01115965936332941, -0.010744286701083183, -0.010328914038836956, -0.009913541376590729, -0.009498168714344501, -0.009082796052098274, -0.008667423389852047, -0.00825205072760582, -0.007836678065359592, -0.007421305403113365, -0.007005932740867138, -0.006590560078620911, -0.006175187416374683, -0.005759814754128456, -0.005344442091882229, -0.004929069429636002, -0.004513696767389774, -0.004098324105143547, -0.00368295144289732, -0.0032675787806510925, -0.0028522061184048653, -0.002436833456158638, -0.0020214607939124107, -0.0016060881316661835, -0.0011907154694199562, -0.0007753428071737289, -0.0003599701449275017, 5.5402517318725586e-05, 0.00047077517956495285, 0.0008861478418111801, 0.0013015205040574074, 0.0017168931663036346, 0.002132265828549862, 0.002547638490796089, 0.0029630111530423164, 0.0033783838152885437, 0.003793756477534771, 0.004209129139780998, 0.0046245018020272255, 0.005039874464273453, 0.00545524712651968, 0.005870619788765907, 0.0062859924510121346, 0.006701365113258362, 0.007116737775504589, 0.007532110437750816, 0.007947483099997044, 0.008362855762243271, 0.008778228424489498, 0.009193601086735725, 0.009608973748981953, 0.01002434641122818, 0.010439719073474407, 0.010855091735720634, 0.011270464397966862, 0.011685837060213089, 0.012101209722459316, 0.012516582384705544, 0.01293195504695177, 0.013347327709197998]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 5.0, 5.0, 10.0, 15.0, 11.0, 17.0, 21.0, 55.0, 67.0, 109.0, 155.0, 276.0, 377.0, 603.0, 1207.0, 3739.0, 45668.0, 924372.0, 64456.0, 4296.0, 1326.0, 658.0, 432.0, 217.0, 170.0, 83.0, 53.0, 40.0, 43.0, 15.0, 12.0, 11.0, 8.0, 5.0, 3.0, 4.0, 6.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0257720947265625, -0.024899721145629883, -0.024027347564697266, -0.02315497398376465, -0.02228260040283203, -0.021410226821899414, -0.020537853240966797, -0.01966547966003418, -0.018793106079101562, -0.017920732498168945, -0.017048358917236328, -0.01617598533630371, -0.015303611755371094, -0.014431238174438477, -0.01355886459350586, -0.012686491012573242, -0.011814117431640625, -0.010941743850708008, -0.01006937026977539, -0.009196996688842773, -0.008324623107910156, -0.007452249526977539, -0.006579875946044922, -0.005707502365112305, -0.0048351287841796875, -0.00396275520324707, -0.003090381622314453, -0.002218008041381836, -0.0013456344604492188, -0.00047326087951660156, 0.0003991127014160156, 0.0012714862823486328, 0.00214385986328125, 0.003016233444213867, 0.0038886070251464844, 0.0047609806060791016, 0.005633354187011719, 0.006505727767944336, 0.007378101348876953, 0.00825047492980957, 0.009122848510742188, 0.009995222091674805, 0.010867595672607422, 0.011739969253540039, 0.012612342834472656, 0.013484716415405273, 0.01435708999633789, 0.015229463577270508, 0.016101837158203125, 0.016974210739135742, 0.01784658432006836, 0.018718957901000977, 0.019591331481933594, 0.02046370506286621, 0.021336078643798828, 0.022208452224731445, 0.023080825805664062, 0.02395319938659668, 0.024825572967529297, 0.025697946548461914, 0.02657032012939453, 0.02744269371032715, 0.028315067291259766, 0.029187440872192383, 0.030059814453125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 18.0, 76.0, 134.0, 236.0, 220.0, 174.0, 98.0, 24.0, 16.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01904296875, -0.018390178680419922, -0.017737388610839844, -0.017084598541259766, -0.016431808471679688, -0.01577901840209961, -0.015126228332519531, -0.014473438262939453, -0.013820648193359375, -0.013167858123779297, -0.012515068054199219, -0.01186227798461914, -0.011209487915039062, -0.010556697845458984, -0.009903907775878906, -0.009251117706298828, -0.00859832763671875, -0.007945537567138672, -0.007292747497558594, -0.006639957427978516, -0.0059871673583984375, -0.005334377288818359, -0.004681587219238281, -0.004028797149658203, -0.003376007080078125, -0.002723217010498047, -0.0020704269409179688, -0.0014176368713378906, -0.0007648468017578125, -0.00011205673217773438, 0.0005407333374023438, 0.0011935234069824219, 0.0018463134765625, 0.002499103546142578, 0.0031518936157226562, 0.0038046836853027344, 0.0044574737548828125, 0.005110263824462891, 0.005763053894042969, 0.006415843963623047, 0.007068634033203125, 0.007721424102783203, 0.008374214172363281, 0.00902700424194336, 0.009679794311523438, 0.010332584381103516, 0.010985374450683594, 0.011638164520263672, 0.01229095458984375, 0.012943744659423828, 0.013596534729003906, 0.014249324798583984, 0.014902114868164062, 0.01555490493774414, 0.01620769500732422, 0.016860485076904297, 0.017513275146484375, 0.018166065216064453, 0.01881885528564453, 0.01947164535522461, 0.020124435424804688, 0.020777225494384766, 0.021430015563964844, 0.022082805633544922, 0.022735595703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 4.0, 7.0, 8.0, 15.0, 20.0, 31.0, 38.0, 52.0, 85.0, 109.0, 188.0, 318.0, 529.0, 1278.0, 3397.0, 13561.0, 116275.0, 718530.0, 169468.0, 17559.0, 4084.0, 1461.0, 631.0, 321.0, 185.0, 109.0, 82.0, 56.0, 45.0, 31.0, 20.0, 13.0, 9.0, 7.0, 3.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01123046875, -0.010773420333862305, -0.01031637191772461, -0.009859323501586914, -0.009402275085449219, -0.008945226669311523, -0.008488178253173828, -0.008031129837036133, -0.0075740814208984375, -0.007117033004760742, -0.006659984588623047, -0.0062029361724853516, -0.005745887756347656, -0.005288839340209961, -0.004831790924072266, -0.00437474250793457, -0.003917694091796875, -0.0034606456756591797, -0.0030035972595214844, -0.002546548843383789, -0.0020895004272460938, -0.0016324520111083984, -0.0011754035949707031, -0.0007183551788330078, -0.0002613067626953125, 0.0001957416534423828, 0.0006527900695800781, 0.0011098384857177734, 0.0015668869018554688, 0.002023935317993164, 0.0024809837341308594, 0.0029380321502685547, 0.00339508056640625, 0.0038521289825439453, 0.004309177398681641, 0.004766225814819336, 0.005223274230957031, 0.0056803226470947266, 0.006137371063232422, 0.006594419479370117, 0.0070514678955078125, 0.007508516311645508, 0.007965564727783203, 0.008422613143920898, 0.008879661560058594, 0.009336709976196289, 0.009793758392333984, 0.01025080680847168, 0.010707855224609375, 0.01116490364074707, 0.011621952056884766, 0.012079000473022461, 0.012536048889160156, 0.012993097305297852, 0.013450145721435547, 0.013907194137573242, 0.014364242553710938, 0.014821290969848633, 0.015278339385986328, 0.015735387802124023, 0.01619243621826172, 0.016649484634399414, 0.01710653305053711, 0.017563581466674805, 0.0180206298828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 7.0, 8.0, 19.0, 21.0, 28.0, 37.0, 29.0, 45.0, 36.0, 50.0, 55.0, 74.0, 61.0, 48.0, 62.0, 66.0, 54.0, 39.0, 47.0, 49.0, 39.0, 34.0, 18.0, 28.0, 10.0, 8.0, 8.0, 7.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01873779296875, -0.018262267112731934, -0.017786741256713867, -0.0173112154006958, -0.016835689544677734, -0.016360163688659668, -0.0158846378326416, -0.015409111976623535, -0.014933586120605469, -0.014458060264587402, -0.013982534408569336, -0.01350700855255127, -0.013031482696533203, -0.012555956840515137, -0.01208043098449707, -0.011604905128479004, -0.011129379272460938, -0.010653853416442871, -0.010178327560424805, -0.009702801704406738, -0.009227275848388672, -0.008751749992370605, -0.008276224136352539, -0.007800698280334473, -0.007325172424316406, -0.00684964656829834, -0.0063741207122802734, -0.005898594856262207, -0.005423069000244141, -0.004947543144226074, -0.004472017288208008, -0.003996491432189941, -0.003520965576171875, -0.0030454397201538086, -0.002569913864135742, -0.0020943880081176758, -0.0016188621520996094, -0.001143336296081543, -0.0006678104400634766, -0.00019228458404541016, 0.00028324127197265625, 0.0007587671279907227, 0.001234292984008789, 0.0017098188400268555, 0.002185344696044922, 0.0026608705520629883, 0.0031363964080810547, 0.003611922264099121, 0.0040874481201171875, 0.004562973976135254, 0.00503849983215332, 0.005514025688171387, 0.005989551544189453, 0.0064650774002075195, 0.006940603256225586, 0.007416129112243652, 0.007891654968261719, 0.008367180824279785, 0.008842706680297852, 0.009318232536315918, 0.009793758392333984, 0.01026928424835205, 0.010744810104370117, 0.011220335960388184, 0.01169586181640625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [5.0, 2.0, 4.0, 4.0, 2.0, 6.0, 8.0, 13.0, 22.0, 18.0, 29.0, 44.0, 59.0, 99.0, 111.0, 233.0, 344.0, 510.0, 861.0, 1483.0, 2530.0, 4647.0, 8596.0, 17737.0, 38730.0, 93972.0, 238820.0, 342374.0, 172664.0, 66896.0, 28355.0, 13397.0, 6956.0, 3730.0, 2042.0, 1268.0, 734.0, 431.0, 295.0, 171.0, 121.0, 69.0, 51.0, 33.0, 29.0, 26.0, 16.0, 8.0, 5.0, 3.0, 1.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0016489028930664062, -0.0015885382890701294, -0.0015281736850738525, -0.0014678090810775757, -0.0014074444770812988, -0.001347079873085022, -0.0012867152690887451, -0.0012263506650924683, -0.0011659860610961914, -0.0011056214570999146, -0.0010452568531036377, -0.0009848922491073608, -0.000924527645111084, -0.0008641630411148071, -0.0008037984371185303, -0.0007434338331222534, -0.0006830692291259766, -0.0006227046251296997, -0.0005623400211334229, -0.000501975417137146, -0.00044161081314086914, -0.0003812462091445923, -0.00032088160514831543, -0.0002605170011520386, -0.00020015239715576172, -0.00013978779315948486, -7.942318916320801e-05, -1.9058585166931152e-05, 4.13060188293457e-05, 0.00010167062282562256, 0.00016203522682189941, 0.00022239983081817627, 0.0002827644348144531, 0.00034312903881073, 0.00040349364280700684, 0.0004638582468032837, 0.0005242228507995605, 0.0005845874547958374, 0.0006449520587921143, 0.0007053166627883911, 0.000765681266784668, 0.0008260458707809448, 0.0008864104747772217, 0.0009467750787734985, 0.0010071396827697754, 0.0010675042867660522, 0.001127868890762329, 0.001188233494758606, 0.0012485980987548828, 0.0013089627027511597, 0.0013693273067474365, 0.0014296919107437134, 0.0014900565147399902, 0.001550421118736267, 0.001610785722732544, 0.0016711503267288208, 0.0017315149307250977, 0.0017918795347213745, 0.0018522441387176514, 0.0019126087427139282, 0.001972973346710205, 0.002033337950706482, 0.002093702554702759, 0.0021540671586990356, 0.0022144317626953125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 3.0, 3.0, 6.0, 8.0, 4.0, 11.0, 10.0, 15.0, 30.0, 43.0, 60.0, 102.0, 117.0, 139.0, 141.0, 110.0, 46.0, 52.0, 32.0, 25.0, 16.0, 9.0, 4.0, 7.0, 3.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001500844955444336, -0.00014518573880195618, -0.00014028698205947876, -0.00013538822531700134, -0.00013048946857452393, -0.0001255907118320465, -0.00012069195508956909, -0.00011579319834709167, -0.00011089444160461426, -0.00010599568486213684, -0.00010109692811965942, -9.619817137718201e-05, -9.129941463470459e-05, -8.640065789222717e-05, -8.150190114974976e-05, -7.660314440727234e-05, -7.170438766479492e-05, -6.68056309223175e-05, -6.190687417984009e-05, -5.700811743736267e-05, -5.2109360694885254e-05, -4.721060395240784e-05, -4.231184720993042e-05, -3.7413090467453e-05, -3.2514333724975586e-05, -2.761557698249817e-05, -2.2716820240020752e-05, -1.7818063497543335e-05, -1.2919306755065918e-05, -8.020550012588501e-06, -3.121793270111084e-06, 1.776963472366333e-06, 6.67572021484375e-06, 1.1574476957321167e-05, 1.6473233699798584e-05, 2.1371990442276e-05, 2.6270747184753418e-05, 3.1169503927230835e-05, 3.606826066970825e-05, 4.096701741218567e-05, 4.5865774154663086e-05, 5.07645308971405e-05, 5.566328763961792e-05, 6.056204438209534e-05, 6.546080112457275e-05, 7.035955786705017e-05, 7.525831460952759e-05, 8.0157071352005e-05, 8.505582809448242e-05, 8.995458483695984e-05, 9.485334157943726e-05, 9.975209832191467e-05, 0.00010465085506439209, 0.00010954961180686951, 0.00011444836854934692, 0.00011934712529182434, 0.00012424588203430176, 0.00012914463877677917, 0.0001340433955192566, 0.000138942152261734, 0.00014384090900421143, 0.00014873966574668884, 0.00015363842248916626, 0.00015853717923164368, 0.0001634359359741211]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 11.0, 17.0, 18.0, 44.0, 58.0, 117.0, 226.0, 537.0, 1652.0, 7849.0, 61094.0, 699339.0, 250288.0, 21942.0, 3668.0, 925.0, 381.0, 159.0, 68.0, 58.0, 43.0, 18.0, 9.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0058441162109375, -0.005647778511047363, -0.0054514408111572266, -0.00525510311126709, -0.005058765411376953, -0.004862427711486816, -0.00466609001159668, -0.004469752311706543, -0.004273414611816406, -0.0040770769119262695, -0.003880739212036133, -0.003684401512145996, -0.0034880638122558594, -0.0032917261123657227, -0.003095388412475586, -0.0028990507125854492, -0.0027027130126953125, -0.0025063753128051758, -0.002310037612915039, -0.0021136999130249023, -0.0019173622131347656, -0.001721024513244629, -0.0015246868133544922, -0.0013283491134643555, -0.0011320114135742188, -0.000935673713684082, -0.0007393360137939453, -0.0005429983139038086, -0.0003466606140136719, -0.00015032291412353516, 4.601478576660156e-05, 0.00024235248565673828, 0.000438690185546875, 0.0006350278854370117, 0.0008313655853271484, 0.0010277032852172852, 0.0012240409851074219, 0.0014203786849975586, 0.0016167163848876953, 0.001813054084777832, 0.0020093917846679688, 0.0022057294845581055, 0.002402067184448242, 0.002598404884338379, 0.0027947425842285156, 0.0029910802841186523, 0.003187417984008789, 0.0033837556838989258, 0.0035800933837890625, 0.0037764310836791992, 0.003972768783569336, 0.004169106483459473, 0.004365444183349609, 0.004561781883239746, 0.004758119583129883, 0.0049544572830200195, 0.005150794982910156, 0.005347132682800293, 0.00554347038269043, 0.005739808082580566, 0.005936145782470703, 0.00613248348236084, 0.0063288211822509766, 0.006525158882141113, 0.00672149658203125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 12.0, 14.0, 11.0, 12.0, 29.0, 38.0, 40.0, 62.0, 97.0, 113.0, 147.0, 121.0, 91.0, 63.0, 40.0, 22.0, 18.0, 16.0, 15.0, 12.0, 8.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00559234619140625, -0.00544700026512146, -0.00530165433883667, -0.00515630841255188, -0.00501096248626709, -0.0048656165599823, -0.00472027063369751, -0.00457492470741272, -0.00442957878112793, -0.00428423285484314, -0.00413888692855835, -0.00399354100227356, -0.0038481950759887695, -0.0037028491497039795, -0.0035575032234191895, -0.0034121572971343994, -0.0032668113708496094, -0.0031214654445648193, -0.0029761195182800293, -0.0028307735919952393, -0.0026854276657104492, -0.002540081739425659, -0.002394735813140869, -0.002249389886856079, -0.002104043960571289, -0.001958698034286499, -0.001813352108001709, -0.001668006181716919, -0.001522660255432129, -0.0013773143291473389, -0.0012319684028625488, -0.0010866224765777588, -0.0009412765502929688, -0.0007959306240081787, -0.0006505846977233887, -0.0005052387714385986, -0.0003598928451538086, -0.00021454691886901855, -6.920099258422852e-05, 7.614493370056152e-05, 0.00022149085998535156, 0.0003668367862701416, 0.0005121827125549316, 0.0006575286388397217, 0.0008028745651245117, 0.0009482204914093018, 0.0010935664176940918, 0.0012389123439788818, 0.0013842582702636719, 0.001529604196548462, 0.001674950122833252, 0.001820296049118042, 0.001965641975402832, 0.002110987901687622, 0.002256333827972412, 0.002401679754257202, 0.002547025680541992, 0.0026923716068267822, 0.0028377175331115723, 0.0029830634593963623, 0.0031284093856811523, 0.0032737553119659424, 0.0034191012382507324, 0.0035644471645355225, 0.0037097930908203125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 12.0, 607.0, 384.0, 14.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05807831138372421, -0.046206049621105194, -0.034333787858486176, -0.022461526095867157, -0.010589264333248138, 0.0012829974293708801, 0.013155259191989899, 0.025027520954608917, 0.036899782717227936, 0.048772044479846954, 0.06064430624246597, 0.07251656800508499, 0.08438882976770401, 0.09626109153032303, 0.10813335329294205, 0.12000561505556107, 0.1318778693675995, 0.1437501311302185, 0.15562239289283752, 0.16749465465545654, 0.17936691641807556, 0.19123917818069458, 0.2031114399433136, 0.21498370170593262, 0.22685596346855164, 0.23872822523117065, 0.2506004869937897, 0.2624727487564087, 0.2743450105190277, 0.28621727228164673, 0.29808953404426575, 0.30996179580688477, 0.32183408737182617, 0.3337063491344452, 0.3455786108970642, 0.3574508726596832, 0.36932313442230225, 0.38119539618492126, 0.3930676579475403, 0.4049399197101593, 0.4168121814727783, 0.42868444323539734, 0.44055670499801636, 0.4524289667606354, 0.4643012285232544, 0.4761734902858734, 0.48804575204849243, 0.49991801381111145, 0.5117902755737305, 0.5236625671386719, 0.5355347990989685, 0.5474070310592651, 0.5592793226242065, 0.571151614189148, 0.5830238461494446, 0.5948960781097412, 0.6067683696746826, 0.618640661239624, 0.6305128931999207, 0.6423851251602173, 0.6542574167251587, 0.6661297082901001, 0.6780019402503967, 0.6898741722106934, 0.7017464637756348]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 4.0, 4.0, 6.0, 16.0, 16.0, 19.0, 17.0, 36.0, 35.0, 42.0, 43.0, 43.0, 56.0, 49.0, 66.0, 71.0, 61.0, 66.0, 65.0, 42.0, 40.0, 41.0, 30.0, 25.0, 26.0, 23.0, 22.0, 12.0, 7.0, 7.0, 4.0, 8.0, 2.0, 3.0, 3.0, 1.0], "bins": [-0.05944877862930298, -0.05809399485588074, -0.0567392073571682, -0.05538441985845566, -0.05402963608503342, -0.052674852311611176, -0.051320064812898636, -0.049965277314186096, -0.048610493540763855, -0.047255709767341614, -0.045900922268629074, -0.044546134769916534, -0.04319135099649429, -0.04183656722307205, -0.04048177972435951, -0.03912699222564697, -0.03777220845222473, -0.03641742467880249, -0.03506263718008995, -0.03370784968137741, -0.03235306590795517, -0.03099828027188778, -0.02964349463582039, -0.028288708999753, -0.026933923363685608, -0.025579137727618217, -0.024224352091550827, -0.022869566455483437, -0.021514780819416046, -0.020159995183348656, -0.018805209547281265, -0.017450423911213875, -0.016095638275146484, -0.014740852639079094, -0.013386067003011703, -0.012031281366944313, -0.010676495730876923, -0.009321710094809532, -0.007966924458742142, -0.006612138822674751, -0.005257353186607361, -0.0039025675505399704, -0.00254778191447258, -0.0011929962784051895, 0.00016178935766220093, 0.0015165749937295914, 0.002871360629796982, 0.004226146265864372, 0.005580931901931763, 0.006935717537999153, 0.008290503174066544, 0.009645288810133934, 0.011000074446201324, 0.012354860082268715, 0.013709645718336105, 0.015064431354403496, 0.016419216990470886, 0.017774002626538277, 0.019128788262605667, 0.020483573898673058, 0.021838359534740448, 0.02319314517080784, 0.02454793080687523, 0.02590271644294262, 0.02725750207901001]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 2.0, 8.0, 6.0, 4.0, 7.0, 17.0, 12.0, 32.0, 39.0, 45.0, 77.0, 99.0, 134.0, 263.0, 594.0, 1441.0, 2700.0, 9671.0, 270738.0, 3872777.0, 27790.0, 4953.0, 1515.0, 601.0, 278.0, 148.0, 97.0, 61.0, 41.0, 30.0, 24.0, 17.0, 14.0, 8.0, 11.0, 2.0, 3.0, 9.0, 6.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.021636962890625, -0.020870208740234375, -0.02010345458984375, -0.019336700439453125, -0.0185699462890625, -0.017803192138671875, -0.01703643798828125, -0.016269683837890625, -0.0155029296875, -0.014736175537109375, -0.01396942138671875, -0.013202667236328125, -0.0124359130859375, -0.011669158935546875, -0.01090240478515625, -0.010135650634765625, -0.009368896484375, -0.008602142333984375, -0.00783538818359375, -0.007068634033203125, -0.0063018798828125, -0.005535125732421875, -0.00476837158203125, -0.004001617431640625, -0.00323486328125, -0.002468109130859375, -0.00170135498046875, -0.000934600830078125, -0.0001678466796875, 0.000598907470703125, 0.00136566162109375, 0.002132415771484375, 0.002899169921875, 0.003665924072265625, 0.00443267822265625, 0.005199432373046875, 0.0059661865234375, 0.006732940673828125, 0.00749969482421875, 0.008266448974609375, 0.009033203125, 0.009799957275390625, 0.01056671142578125, 0.011333465576171875, 0.0121002197265625, 0.012866973876953125, 0.01363372802734375, 0.014400482177734375, 0.015167236328125, 0.015933990478515625, 0.01670074462890625, 0.017467498779296875, 0.0182342529296875, 0.019001007080078125, 0.01976776123046875, 0.020534515380859375, 0.02130126953125, 0.022068023681640625, 0.02283477783203125, 0.023601531982421875, 0.0243682861328125, 0.025135040283203125, 0.02590179443359375, 0.026668548583984375, 0.027435302734375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 25.0, 90.0, 171.0, 228.0, 220.0, 163.0, 67.0, 19.0, 11.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0196990966796875, -0.019040584564208984, -0.01838207244873047, -0.017723560333251953, -0.017065048217773438, -0.016406536102294922, -0.015748023986816406, -0.01508951187133789, -0.014430999755859375, -0.01377248764038086, -0.013113975524902344, -0.012455463409423828, -0.011796951293945312, -0.011138439178466797, -0.010479927062988281, -0.009821414947509766, -0.00916290283203125, -0.008504390716552734, -0.007845878601074219, -0.007187366485595703, -0.0065288543701171875, -0.005870342254638672, -0.005211830139160156, -0.004553318023681641, -0.003894805908203125, -0.0032362937927246094, -0.0025777816772460938, -0.0019192695617675781, -0.0012607574462890625, -0.0006022453308105469, 5.626678466796875e-05, 0.0007147789001464844, 0.001373291015625, 0.0020318031311035156, 0.0026903152465820312, 0.003348827362060547, 0.0040073394775390625, 0.004665851593017578, 0.005324363708496094, 0.005982875823974609, 0.006641387939453125, 0.007299900054931641, 0.007958412170410156, 0.008616924285888672, 0.009275436401367188, 0.009933948516845703, 0.010592460632324219, 0.011250972747802734, 0.01190948486328125, 0.012567996978759766, 0.013226509094238281, 0.013885021209716797, 0.014543533325195312, 0.015202045440673828, 0.015860557556152344, 0.01651906967163086, 0.017177581787109375, 0.01783609390258789, 0.018494606018066406, 0.019153118133544922, 0.019811630249023438, 0.020470142364501953, 0.02112865447998047, 0.021787166595458984, 0.0224456787109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 5.0, 3.0, 6.0, 5.0, 7.0, 14.0, 15.0, 17.0, 10.0, 30.0, 40.0, 50.0, 68.0, 109.0, 146.0, 258.0, 449.0, 823.0, 1716.0, 3777.0, 11465.0, 54002.0, 968960.0, 3046578.0, 81199.0, 15533.0, 4837.0, 1902.0, 974.0, 511.0, 271.0, 155.0, 96.0, 71.0, 48.0, 32.0, 29.0, 22.0, 11.0, 14.0, 8.0, 5.0, 6.0, 2.0, 2.0, 1.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0106658935546875, -0.010333657264709473, -0.010001420974731445, -0.009669184684753418, -0.00933694839477539, -0.009004712104797363, -0.008672475814819336, -0.008340239524841309, -0.008008003234863281, -0.007675766944885254, -0.0073435306549072266, -0.007011294364929199, -0.006679058074951172, -0.0063468217849731445, -0.006014585494995117, -0.00568234920501709, -0.0053501129150390625, -0.005017876625061035, -0.004685640335083008, -0.0043534040451049805, -0.004021167755126953, -0.0036889314651489258, -0.0033566951751708984, -0.003024458885192871, -0.0026922225952148438, -0.0023599863052368164, -0.002027750015258789, -0.0016955137252807617, -0.0013632774353027344, -0.001031041145324707, -0.0006988048553466797, -0.00036656856536865234, -3.4332275390625e-05, 0.00029790401458740234, 0.0006301403045654297, 0.000962376594543457, 0.0012946128845214844, 0.0016268491744995117, 0.001959085464477539, 0.0022913217544555664, 0.0026235580444335938, 0.002955794334411621, 0.0032880306243896484, 0.0036202669143676758, 0.003952503204345703, 0.0042847394943237305, 0.004616975784301758, 0.004949212074279785, 0.0052814483642578125, 0.00561368465423584, 0.005945920944213867, 0.0062781572341918945, 0.006610393524169922, 0.006942629814147949, 0.0072748661041259766, 0.007607102394104004, 0.007939338684082031, 0.008271574974060059, 0.008603811264038086, 0.008936047554016113, 0.00926828384399414, 0.009600520133972168, 0.009932756423950195, 0.010264992713928223, 0.01059722900390625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 7.0, 5.0, 16.0, 30.0, 75.0, 109.0, 505.0, 2020.0, 876.0, 202.0, 95.0, 45.0, 20.0, 28.0, 14.0, 9.0, 5.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0170745849609375, -0.01666438579559326, -0.016254186630249023, -0.015843987464904785, -0.015433788299560547, -0.015023589134216309, -0.01461338996887207, -0.014203190803527832, -0.013792991638183594, -0.013382792472839355, -0.012972593307495117, -0.012562394142150879, -0.01215219497680664, -0.011741995811462402, -0.011331796646118164, -0.010921597480773926, -0.010511398315429688, -0.01010119915008545, -0.009690999984741211, -0.009280800819396973, -0.008870601654052734, -0.008460402488708496, -0.008050203323364258, -0.0076400041580200195, -0.007229804992675781, -0.006819605827331543, -0.006409406661987305, -0.005999207496643066, -0.005589008331298828, -0.00517880916595459, -0.0047686100006103516, -0.004358410835266113, -0.003948211669921875, -0.0035380125045776367, -0.0031278133392333984, -0.00271761417388916, -0.002307415008544922, -0.0018972158432006836, -0.0014870166778564453, -0.001076817512512207, -0.0006666183471679688, -0.00025641918182373047, 0.0001537799835205078, 0.0005639791488647461, 0.0009741783142089844, 0.0013843774795532227, 0.001794576644897461, 0.0022047758102416992, 0.0026149749755859375, 0.0030251741409301758, 0.003435373306274414, 0.0038455724716186523, 0.004255771636962891, 0.004665970802307129, 0.005076169967651367, 0.0054863691329956055, 0.005896568298339844, 0.006306767463684082, 0.00671696662902832, 0.007127165794372559, 0.007537364959716797, 0.007947564125061035, 0.008357763290405273, 0.008767962455749512, 0.00917816162109375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 5.0, 4.0, 27.0, 47.0, 161.0, 362.0, 261.0, 96.0, 27.0, 13.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1007395014166832, -0.0984795019030571, -0.0962194949388504, -0.0939594954252243, -0.0916994959115982, -0.0894394963979721, -0.08717949688434601, -0.08491948992013931, -0.08265949040651321, -0.08039949089288712, -0.07813948392868042, -0.07587948441505432, -0.07361948490142822, -0.07135948538780212, -0.06909948587417603, -0.06683947890996933, -0.06457947939634323, -0.06231947988271713, -0.060059476643800735, -0.05779947340488434, -0.05553947389125824, -0.05327947437763214, -0.051019471138715744, -0.04875946789979935, -0.04649946838617325, -0.04423946887254715, -0.04197946563363075, -0.039719462394714355, -0.03745946288108826, -0.03519946336746216, -0.03293946012854576, -0.030679458752274513, -0.028419457376003265, -0.026159455999732018, -0.02389945462346077, -0.021639453247189522, -0.019379451870918274, -0.017119450494647026, -0.014859449118375778, -0.01259944774210453, -0.010339446365833282, -0.008079444989562035, -0.005819443613290787, -0.003559442237019539, -0.001299440860748291, 0.0009605605155229568, 0.0032205618917942047, 0.005480563268065453, 0.0077405646443367004, 0.010000566020607948, 0.012260567396879196, 0.014520568773150444, 0.016780570149421692, 0.01904057152569294, 0.021300572901964188, 0.023560574278235435, 0.025820575654506683, 0.02808057703077793, 0.03034057840704918, 0.032600581645965576, 0.034860581159591675, 0.03712058067321777, 0.03938058391213417, 0.04164058715105057, 0.043900586664676666]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 4.0, 4.0, 6.0, 7.0, 9.0, 17.0, 16.0, 19.0, 24.0, 21.0, 29.0, 39.0, 33.0, 39.0, 30.0, 41.0, 34.0, 39.0, 42.0, 39.0, 61.0, 46.0, 34.0, 40.0, 44.0, 33.0, 36.0, 40.0, 36.0, 22.0, 26.0, 15.0, 22.0, 9.0, 10.0, 8.0, 3.0, 6.0, 7.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.020525634288787842, -0.019929347559809685, -0.019333060830831528, -0.01873677410185337, -0.018140487372875214, -0.017544200643897057, -0.0169479139149189, -0.016351627185940742, -0.015755340456962585, -0.015159053727984428, -0.014562766999006271, -0.013966480270028114, -0.013370193541049957, -0.0127739068120718, -0.012177620083093643, -0.011581333354115486, -0.010985046625137329, -0.010388759896159172, -0.009792473167181015, -0.009196186438202858, -0.008599899709224701, -0.008003612980246544, -0.007407326251268387, -0.00681103952229023, -0.006214752793312073, -0.005618466064333916, -0.005022179335355759, -0.004425892606377602, -0.0038296058773994446, -0.0032333191484212875, -0.0026370324194431305, -0.0020407456904649734, -0.0014444589614868164, -0.0008481722325086594, -0.0002518855035305023, 0.0003444012254476547, 0.0009406879544258118, 0.0015369746834039688, 0.002133261412382126, 0.002729548141360283, 0.00332583487033844, 0.003922121599316597, 0.004518408328294754, 0.005114695057272911, 0.005710981786251068, 0.006307268515229225, 0.006903555244207382, 0.007499841973185539, 0.008096128702163696, 0.008692415431141853, 0.00928870216012001, 0.009884988889098167, 0.010481275618076324, 0.011077562347054482, 0.011673849076032639, 0.012270135805010796, 0.012866422533988953, 0.01346270926296711, 0.014058995991945267, 0.014655282720923424, 0.01525156944990158, 0.015847856178879738, 0.016444142907857895, 0.017040429636836052, 0.01763671636581421]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 2.0, 3.0, 6.0, 7.0, 6.0, 10.0, 13.0, 19.0, 24.0, 39.0, 76.0, 118.0, 191.0, 349.0, 609.0, 1354.0, 4803.0, 87034.0, 929523.0, 19418.0, 2770.0, 990.0, 493.0, 277.0, 155.0, 86.0, 68.0, 33.0, 21.0, 13.0, 8.0, 13.0, 8.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041412353515625, -0.04004621505737305, -0.038680076599121094, -0.03731393814086914, -0.03594779968261719, -0.034581661224365234, -0.03321552276611328, -0.03184938430786133, -0.030483245849609375, -0.029117107391357422, -0.02775096893310547, -0.026384830474853516, -0.025018692016601562, -0.02365255355834961, -0.022286415100097656, -0.020920276641845703, -0.01955413818359375, -0.018187999725341797, -0.016821861267089844, -0.01545572280883789, -0.014089584350585938, -0.012723445892333984, -0.011357307434082031, -0.009991168975830078, -0.008625030517578125, -0.007258892059326172, -0.005892753601074219, -0.004526615142822266, -0.0031604766845703125, -0.0017943382263183594, -0.00042819976806640625, 0.0009379386901855469, 0.0023040771484375, 0.003670215606689453, 0.005036354064941406, 0.006402492523193359, 0.0077686309814453125, 0.009134769439697266, 0.010500907897949219, 0.011867046356201172, 0.013233184814453125, 0.014599323272705078, 0.01596546173095703, 0.017331600189208984, 0.018697738647460938, 0.02006387710571289, 0.021430015563964844, 0.022796154022216797, 0.02416229248046875, 0.025528430938720703, 0.026894569396972656, 0.02826070785522461, 0.029626846313476562, 0.030992984771728516, 0.03235912322998047, 0.03372526168823242, 0.035091400146484375, 0.03645753860473633, 0.03782367706298828, 0.039189815521240234, 0.04055595397949219, 0.04192209243774414, 0.043288230895996094, 0.04465436935424805, 0.0460205078125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 8.0, 43.0, 113.0, 194.0, 244.0, 208.0, 120.0, 47.0, 12.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02069091796875, -0.020014047622680664, -0.019337177276611328, -0.018660306930541992, -0.017983436584472656, -0.01730656623840332, -0.016629695892333984, -0.01595282554626465, -0.015275955200195312, -0.014599084854125977, -0.01392221450805664, -0.013245344161987305, -0.012568473815917969, -0.011891603469848633, -0.011214733123779297, -0.010537862777709961, -0.009860992431640625, -0.009184122085571289, -0.008507251739501953, -0.007830381393432617, -0.007153511047363281, -0.006476640701293945, -0.005799770355224609, -0.0051229000091552734, -0.0044460296630859375, -0.0037691593170166016, -0.0030922889709472656, -0.0024154186248779297, -0.0017385482788085938, -0.0010616779327392578, -0.0003848075866699219, 0.00029206275939941406, 0.00096893310546875, 0.001645803451538086, 0.002322673797607422, 0.002999544143676758, 0.0036764144897460938, 0.00435328483581543, 0.005030155181884766, 0.0057070255279541016, 0.0063838958740234375, 0.0070607662200927734, 0.007737636566162109, 0.008414506912231445, 0.009091377258300781, 0.009768247604370117, 0.010445117950439453, 0.011121988296508789, 0.011798858642578125, 0.012475728988647461, 0.013152599334716797, 0.013829469680786133, 0.014506340026855469, 0.015183210372924805, 0.01586008071899414, 0.016536951065063477, 0.017213821411132812, 0.01789069175720215, 0.018567562103271484, 0.01924443244934082, 0.019921302795410156, 0.020598173141479492, 0.021275043487548828, 0.021951913833618164, 0.0226287841796875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 8.0, 4.0, 7.0, 13.0, 19.0, 21.0, 30.0, 50.0, 70.0, 106.0, 178.0, 335.0, 598.0, 1024.0, 2061.0, 5040.0, 17227.0, 98270.0, 585951.0, 283135.0, 38990.0, 8979.0, 3093.0, 1444.0, 769.0, 448.0, 247.0, 167.0, 94.0, 68.0, 37.0, 18.0, 12.0, 12.0, 10.0, 8.0, 3.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01526641845703125, -0.014800310134887695, -0.01433420181274414, -0.013868093490600586, -0.013401985168457031, -0.012935876846313477, -0.012469768524169922, -0.012003660202026367, -0.011537551879882812, -0.011071443557739258, -0.010605335235595703, -0.010139226913452148, -0.009673118591308594, -0.009207010269165039, -0.008740901947021484, -0.00827479362487793, -0.007808685302734375, -0.00734257698059082, -0.006876468658447266, -0.006410360336303711, -0.005944252014160156, -0.0054781436920166016, -0.005012035369873047, -0.004545927047729492, -0.0040798187255859375, -0.003613710403442383, -0.003147602081298828, -0.0026814937591552734, -0.0022153854370117188, -0.001749277114868164, -0.0012831687927246094, -0.0008170604705810547, -0.0003509521484375, 0.00011515617370605469, 0.0005812644958496094, 0.001047372817993164, 0.0015134811401367188, 0.0019795894622802734, 0.002445697784423828, 0.002911806106567383, 0.0033779144287109375, 0.003844022750854492, 0.004310131072998047, 0.0047762393951416016, 0.005242347717285156, 0.005708456039428711, 0.006174564361572266, 0.00664067268371582, 0.007106781005859375, 0.00757288932800293, 0.008038997650146484, 0.008505105972290039, 0.008971214294433594, 0.009437322616577148, 0.009903430938720703, 0.010369539260864258, 0.010835647583007812, 0.011301755905151367, 0.011767864227294922, 0.012233972549438477, 0.012700080871582031, 0.013166189193725586, 0.01363229751586914, 0.014098405838012695, 0.01456451416015625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 9.0, 6.0, 8.0, 5.0, 11.0, 11.0, 12.0, 18.0, 20.0, 33.0, 32.0, 32.0, 57.0, 43.0, 58.0, 69.0, 73.0, 60.0, 82.0, 51.0, 41.0, 48.0, 58.0, 34.0, 29.0, 19.0, 23.0, 16.0, 17.0, 10.0, 6.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0176239013671875, -0.017091989517211914, -0.016560077667236328, -0.016028165817260742, -0.015496253967285156, -0.01496434211730957, -0.014432430267333984, -0.013900518417358398, -0.013368606567382812, -0.012836694717407227, -0.01230478286743164, -0.011772871017456055, -0.011240959167480469, -0.010709047317504883, -0.010177135467529297, -0.009645223617553711, -0.009113311767578125, -0.008581399917602539, -0.008049488067626953, -0.007517576217651367, -0.006985664367675781, -0.006453752517700195, -0.005921840667724609, -0.0053899288177490234, -0.0048580169677734375, -0.0043261051177978516, -0.0037941932678222656, -0.0032622814178466797, -0.0027303695678710938, -0.002198457717895508, -0.0016665458679199219, -0.001134634017944336, -0.00060272216796875, -7.081031799316406e-05, 0.0004611015319824219, 0.0009930133819580078, 0.0015249252319335938, 0.0020568370819091797, 0.0025887489318847656, 0.0031206607818603516, 0.0036525726318359375, 0.0041844844818115234, 0.004716396331787109, 0.005248308181762695, 0.005780220031738281, 0.006312131881713867, 0.006844043731689453, 0.007375955581665039, 0.007907867431640625, 0.008439779281616211, 0.008971691131591797, 0.009503602981567383, 0.010035514831542969, 0.010567426681518555, 0.01109933853149414, 0.011631250381469727, 0.012163162231445312, 0.012695074081420898, 0.013226985931396484, 0.01375889778137207, 0.014290809631347656, 0.014822721481323242, 0.015354633331298828, 0.015886545181274414, 0.01641845703125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 5.0, 1.0, 7.0, 8.0, 12.0, 12.0, 20.0, 22.0, 36.0, 58.0, 87.0, 143.0, 181.0, 309.0, 408.0, 573.0, 865.0, 1374.0, 2114.0, 3449.0, 6337.0, 12124.0, 26700.0, 74310.0, 317933.0, 433749.0, 101564.0, 33314.0, 14416.0, 7304.0, 4108.0, 2429.0, 1481.0, 1012.0, 662.0, 431.0, 298.0, 213.0, 164.0, 102.0, 66.0, 58.0, 25.0, 25.0, 9.0, 10.0, 7.0, 3.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0], "bins": [-0.0029735565185546875, -0.002880990505218506, -0.0027884244918823242, -0.0026958584785461426, -0.002603292465209961, -0.0025107264518737793, -0.0024181604385375977, -0.002325594425201416, -0.0022330284118652344, -0.0021404623985290527, -0.002047896385192871, -0.0019553303718566895, -0.0018627643585205078, -0.0017701983451843262, -0.0016776323318481445, -0.0015850663185119629, -0.0014925003051757812, -0.0013999342918395996, -0.001307368278503418, -0.0012148022651672363, -0.0011222362518310547, -0.001029670238494873, -0.0009371042251586914, -0.0008445382118225098, -0.0007519721984863281, -0.0006594061851501465, -0.0005668401718139648, -0.0004742741584777832, -0.00038170814514160156, -0.0002891421318054199, -0.00019657611846923828, -0.00010401010513305664, -1.1444091796875e-05, 8.112192153930664e-05, 0.00017368793487548828, 0.0002662539482116699, 0.00035881996154785156, 0.0004513859748840332, 0.0005439519882202148, 0.0006365180015563965, 0.0007290840148925781, 0.0008216500282287598, 0.0009142160415649414, 0.001006782054901123, 0.0010993480682373047, 0.0011919140815734863, 0.001284480094909668, 0.0013770461082458496, 0.0014696121215820312, 0.0015621781349182129, 0.0016547441482543945, 0.0017473101615905762, 0.0018398761749267578, 0.0019324421882629395, 0.002025008201599121, 0.0021175742149353027, 0.0022101402282714844, 0.002302706241607666, 0.0023952722549438477, 0.0024878382682800293, 0.002580404281616211, 0.0026729702949523926, 0.0027655363082885742, 0.002858102321624756, 0.0029506683349609375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 7.0, 5.0, 5.0, 7.0, 6.0, 11.0, 13.0, 22.0, 30.0, 26.0, 43.0, 80.0, 114.0, 124.0, 112.0, 119.0, 85.0, 45.0, 44.0, 17.0, 21.0, 20.0, 19.0, 3.0, 7.0, 10.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.936094284057617e-05, -9.62642952799797e-05, -9.316764771938324e-05, -9.007100015878677e-05, -8.697435259819031e-05, -8.387770503759384e-05, -8.078105747699738e-05, -7.768440991640091e-05, -7.458776235580444e-05, -7.149111479520798e-05, -6.839446723461151e-05, -6.529781967401505e-05, -6.220117211341858e-05, -5.910452455282211e-05, -5.600787699222565e-05, -5.291122943162918e-05, -4.9814581871032715e-05, -4.671793431043625e-05, -4.362128674983978e-05, -4.052463918924332e-05, -3.742799162864685e-05, -3.4331344068050385e-05, -3.123469650745392e-05, -2.8138048946857452e-05, -2.5041401386260986e-05, -2.194475382566452e-05, -1.8848106265068054e-05, -1.5751458704471588e-05, -1.2654811143875122e-05, -9.558163583278656e-06, -6.46151602268219e-06, -3.364868462085724e-06, -2.682209014892578e-07, 2.8284266591072083e-06, 5.925074219703674e-06, 9.02172178030014e-06, 1.2118369340896606e-05, 1.5215016901493073e-05, 1.831166446208954e-05, 2.1408312022686005e-05, 2.450495958328247e-05, 2.7601607143878937e-05, 3.06982547044754e-05, 3.379490226507187e-05, 3.6891549825668335e-05, 3.99881973862648e-05, 4.308484494686127e-05, 4.618149250745773e-05, 4.92781400680542e-05, 5.2374787628650665e-05, 5.547143518924713e-05, 5.85680827498436e-05, 6.166473031044006e-05, 6.476137787103653e-05, 6.7858025431633e-05, 7.095467299222946e-05, 7.405132055282593e-05, 7.71479681134224e-05, 8.024461567401886e-05, 8.334126323461533e-05, 8.643791079521179e-05, 8.953455835580826e-05, 9.263120591640472e-05, 9.572785347700119e-05, 9.882450103759766e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 9.0, 13.0, 16.0, 21.0, 28.0, 37.0, 66.0, 124.0, 244.0, 455.0, 873.0, 1955.0, 4469.0, 12323.0, 40247.0, 221186.0, 626766.0, 101532.0, 24098.0, 8058.0, 3083.0, 1451.0, 700.0, 323.0, 206.0, 100.0, 61.0, 33.0, 16.0, 15.0, 12.0, 8.0, 5.0, 5.0, 6.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.005031585693359375, -0.00488048791885376, -0.0047293901443481445, -0.004578292369842529, -0.004427194595336914, -0.004276096820831299, -0.004124999046325684, -0.003973901271820068, -0.003822803497314453, -0.003671705722808838, -0.0035206079483032227, -0.0033695101737976074, -0.003218412399291992, -0.003067314624786377, -0.0029162168502807617, -0.0027651190757751465, -0.0026140213012695312, -0.002462923526763916, -0.0023118257522583008, -0.0021607279777526855, -0.0020096302032470703, -0.001858532428741455, -0.0017074346542358398, -0.0015563368797302246, -0.0014052391052246094, -0.0012541413307189941, -0.001103043556213379, -0.0009519457817077637, -0.0008008480072021484, -0.0006497502326965332, -0.000498652458190918, -0.00034755468368530273, -0.0001964569091796875, -4.5359134674072266e-05, 0.00010573863983154297, 0.0002568364143371582, 0.00040793418884277344, 0.0005590319633483887, 0.0007101297378540039, 0.0008612275123596191, 0.0010123252868652344, 0.0011634230613708496, 0.0013145208358764648, 0.00146561861038208, 0.0016167163848876953, 0.0017678141593933105, 0.0019189119338989258, 0.002070009708404541, 0.0022211074829101562, 0.0023722052574157715, 0.0025233030319213867, 0.002674400806427002, 0.002825498580932617, 0.0029765963554382324, 0.0031276941299438477, 0.003278791904449463, 0.003429889678955078, 0.0035809874534606934, 0.0037320852279663086, 0.003883183002471924, 0.004034280776977539, 0.004185378551483154, 0.0043364763259887695, 0.004487574100494385, 0.004638671875]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 10.0, 9.0, 17.0, 21.0, 29.0, 37.0, 47.0, 70.0, 106.0, 136.0, 123.0, 103.0, 83.0, 63.0, 41.0, 26.0, 21.0, 15.0, 12.0, 4.0, 3.0, 9.0, 1.0, 3.0, 0.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034809112548828125, -0.003347426652908325, -0.003213942050933838, -0.0030804574489593506, -0.0029469728469848633, -0.002813488245010376, -0.0026800036430358887, -0.0025465190410614014, -0.002413034439086914, -0.0022795498371124268, -0.0021460652351379395, -0.002012580633163452, -0.0018790960311889648, -0.0017456114292144775, -0.0016121268272399902, -0.001478642225265503, -0.0013451576232910156, -0.0012116730213165283, -0.001078188419342041, -0.0009447038173675537, -0.0008112192153930664, -0.0006777346134185791, -0.0005442500114440918, -0.0004107654094696045, -0.0002772808074951172, -0.00014379620552062988, -1.0311603546142578e-05, 0.00012317299842834473, 0.00025665760040283203, 0.00039014220237731934, 0.0005236268043518066, 0.0006571114063262939, 0.0007905960083007812, 0.0009240806102752686, 0.0010575652122497559, 0.0011910498142242432, 0.0013245344161987305, 0.0014580190181732178, 0.001591503620147705, 0.0017249882221221924, 0.0018584728240966797, 0.001991957426071167, 0.0021254420280456543, 0.0022589266300201416, 0.002392411231994629, 0.002525895833969116, 0.0026593804359436035, 0.002792865037918091, 0.002926349639892578, 0.0030598342418670654, 0.0031933188438415527, 0.00332680344581604, 0.0034602880477905273, 0.0035937726497650146, 0.003727257251739502, 0.0038607418537139893, 0.0039942264556884766, 0.004127711057662964, 0.004261195659637451, 0.0043946802616119385, 0.004528164863586426, 0.004661649465560913, 0.0047951340675354, 0.004928618669509888, 0.005062103271484375]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 9.0, 20.0, 49.0, 117.0, 202.0, 273.0, 162.0, 76.0, 60.0, 17.0, 11.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08436357975006104, -0.08147940039634705, -0.07859522104263306, -0.07571104168891907, -0.07282686233520508, -0.06994268298149109, -0.0670585036277771, -0.06417432427406311, -0.06129014864563942, -0.05840596929192543, -0.05552178993821144, -0.05263761430978775, -0.04975343495607376, -0.04686925560235977, -0.04398507624864578, -0.04110089689493179, -0.038216717541217804, -0.035332538187503815, -0.032448358833789825, -0.029564181342720985, -0.026680001989006996, -0.023795822635293007, -0.020911645144224167, -0.018027465790510178, -0.015143286436796188, -0.012259107083082199, -0.009374928660690784, -0.00649075023829937, -0.0036065708845853806, -0.0007223915308713913, 0.0021617859601974487, 0.005045965313911438, 0.007930144667625427, 0.010814324021339417, 0.013698502443730831, 0.016582680866122246, 0.019466860219836235, 0.022351039573550224, 0.025235217064619064, 0.028119396418333054, 0.031003575772047043, 0.03388775512576103, 0.03677193447947502, 0.03965611010789871, 0.0425402894616127, 0.04542446881532669, 0.04830864816904068, 0.05119282752275467, 0.05407700687646866, 0.05696118623018265, 0.05984536558389664, 0.06272954493761063, 0.06561372429132462, 0.0684979036450386, 0.071382075548172, 0.07426625490188599, 0.07715043425559998, 0.08003461360931396, 0.08291879296302795, 0.08580297231674194, 0.08868715167045593, 0.09157133102416992, 0.09445551037788391, 0.0973396897315979, 0.10022386908531189]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 6.0, 4.0, 7.0, 4.0, 11.0, 10.0, 5.0, 12.0, 15.0, 17.0, 18.0, 18.0, 15.0, 14.0, 18.0, 42.0, 32.0, 40.0, 30.0, 28.0, 53.0, 32.0, 42.0, 46.0, 44.0, 39.0, 44.0, 38.0, 53.0, 35.0, 37.0, 33.0, 26.0, 18.0, 18.0, 14.0, 11.0, 18.0, 10.0, 13.0, 6.0, 5.0, 4.0, 6.0, 4.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033133864402770996, -0.032058119773864746, -0.030982377007603645, -0.029906634241342545, -0.028830889612436295, -0.027755144983530045, -0.026679402217268944, -0.025603659451007843, -0.024527914822101593, -0.023452170193195343, -0.022376427426934242, -0.02130068466067314, -0.02022494003176689, -0.01914919540286064, -0.01807345263659954, -0.01699770987033844, -0.01592196524143219, -0.014846221543848515, -0.01377047784626484, -0.012694734148681164, -0.011618990451097488, -0.010543246753513813, -0.009467503055930138, -0.008391759358346462, -0.007316015660762787, -0.0062402719631791115, -0.005164528265595436, -0.004088784568011761, -0.0030130408704280853, -0.00193729717284441, -0.0008615534752607346, 0.00021419022232294083, 0.0012899339199066162, 0.0023656776174902916, 0.003441421315073967, 0.004517165012657642, 0.005592908710241318, 0.006668652407824993, 0.0077443961054086685, 0.008820139802992344, 0.00989588350057602, 0.010971627198159695, 0.01204737089574337, 0.013123114593327045, 0.01419885829091072, 0.015274601988494396, 0.01635034568607807, 0.017426088452339172, 0.018501833081245422, 0.019577577710151672, 0.020653320476412773, 0.021729063242673874, 0.022804807871580124, 0.023880552500486374, 0.024956295266747475, 0.026032038033008575, 0.027107782661914825, 0.028183527290821075, 0.029259270057082176, 0.030335012823343277, 0.03141075745224953, 0.03248650208115578, 0.03356224298477173, 0.03463798761367798, 0.03571373224258423]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 0.0, 6.0, 0.0, 6.0, 5.0, 9.0, 16.0, 20.0, 24.0, 27.0, 45.0, 91.0, 99.0, 158.0, 222.0, 521.0, 1240.0, 2800.0, 8611.0, 122197.0, 4002190.0, 45941.0, 6566.0, 1902.0, 713.0, 287.0, 178.0, 120.0, 75.0, 57.0, 48.0, 25.0, 21.0, 15.0, 12.0, 12.0, 5.0, 3.0, 5.0, 1.0, 7.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.02362060546875, -0.022787809371948242, -0.021955013275146484, -0.021122217178344727, -0.02028942108154297, -0.01945662498474121, -0.018623828887939453, -0.017791032791137695, -0.016958236694335938, -0.01612544059753418, -0.015292644500732422, -0.014459848403930664, -0.013627052307128906, -0.012794256210327148, -0.01196146011352539, -0.011128664016723633, -0.010295867919921875, -0.009463071823120117, -0.00863027572631836, -0.0077974796295166016, -0.006964683532714844, -0.006131887435913086, -0.005299091339111328, -0.00446629524230957, -0.0036334991455078125, -0.0028007030487060547, -0.001967906951904297, -0.001135110855102539, -0.00030231475830078125, 0.0005304813385009766, 0.0013632774353027344, 0.002196073532104492, 0.00302886962890625, 0.003861665725708008, 0.004694461822509766, 0.0055272579193115234, 0.006360054016113281, 0.007192850112915039, 0.008025646209716797, 0.008858442306518555, 0.009691238403320312, 0.01052403450012207, 0.011356830596923828, 0.012189626693725586, 0.013022422790527344, 0.013855218887329102, 0.01468801498413086, 0.015520811080932617, 0.016353607177734375, 0.017186403274536133, 0.01801919937133789, 0.01885199546813965, 0.019684791564941406, 0.020517587661743164, 0.021350383758544922, 0.02218317985534668, 0.023015975952148438, 0.023848772048950195, 0.024681568145751953, 0.02551436424255371, 0.02634716033935547, 0.027179956436157227, 0.028012752532958984, 0.028845548629760742, 0.0296783447265625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 5.0, 20.0, 85.0, 155.0, 202.0, 246.0, 168.0, 87.0, 19.0, 12.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0213775634765625, -0.020689725875854492, -0.020001888275146484, -0.019314050674438477, -0.01862621307373047, -0.01793837547302246, -0.017250537872314453, -0.016562700271606445, -0.015874862670898438, -0.01518702507019043, -0.014499187469482422, -0.013811349868774414, -0.013123512268066406, -0.012435674667358398, -0.01174783706665039, -0.011059999465942383, -0.010372161865234375, -0.009684324264526367, -0.00899648666381836, -0.008308649063110352, -0.007620811462402344, -0.006932973861694336, -0.006245136260986328, -0.00555729866027832, -0.0048694610595703125, -0.004181623458862305, -0.003493785858154297, -0.002805948257446289, -0.0021181106567382812, -0.0014302730560302734, -0.0007424354553222656, -5.459785461425781e-05, 0.00063323974609375, 0.0013210773468017578, 0.0020089149475097656, 0.0026967525482177734, 0.0033845901489257812, 0.004072427749633789, 0.004760265350341797, 0.005448102951049805, 0.0061359405517578125, 0.00682377815246582, 0.007511615753173828, 0.008199453353881836, 0.008887290954589844, 0.009575128555297852, 0.01026296615600586, 0.010950803756713867, 0.011638641357421875, 0.012326478958129883, 0.01301431655883789, 0.013702154159545898, 0.014389991760253906, 0.015077829360961914, 0.015765666961669922, 0.01645350456237793, 0.017141342163085938, 0.017829179763793945, 0.018517017364501953, 0.01920485496520996, 0.01989269256591797, 0.020580530166625977, 0.021268367767333984, 0.021956205368041992, 0.02264404296875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 8.0, 11.0, 8.0, 19.0, 38.0, 59.0, 87.0, 185.0, 310.0, 534.0, 995.0, 1870.0, 3937.0, 9984.0, 34574.0, 223639.0, 3609495.0, 251562.0, 37799.0, 10791.0, 4154.0, 1966.0, 1028.0, 529.0, 311.0, 156.0, 99.0, 61.0, 29.0, 28.0, 10.0, 8.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01122283935546875, -0.010877728462219238, -0.010532617568969727, -0.010187506675720215, -0.009842395782470703, -0.009497284889221191, -0.00915217399597168, -0.008807063102722168, -0.008461952209472656, -0.008116841316223145, -0.007771730422973633, -0.007426619529724121, -0.007081508636474609, -0.006736397743225098, -0.006391286849975586, -0.006046175956726074, -0.0057010650634765625, -0.005355954170227051, -0.005010843276977539, -0.004665732383728027, -0.004320621490478516, -0.003975510597229004, -0.003630399703979492, -0.0032852888107299805, -0.0029401779174804688, -0.002595067024230957, -0.0022499561309814453, -0.0019048452377319336, -0.0015597343444824219, -0.0012146234512329102, -0.0008695125579833984, -0.0005244016647338867, -0.000179290771484375, 0.00016582012176513672, 0.0005109310150146484, 0.0008560419082641602, 0.0012011528015136719, 0.0015462636947631836, 0.0018913745880126953, 0.002236485481262207, 0.0025815963745117188, 0.0029267072677612305, 0.003271818161010742, 0.003616929054260254, 0.003962039947509766, 0.004307150840759277, 0.004652261734008789, 0.004997372627258301, 0.0053424835205078125, 0.005687594413757324, 0.006032705307006836, 0.006377816200256348, 0.006722927093505859, 0.007068037986755371, 0.007413148880004883, 0.0077582597732543945, 0.008103370666503906, 0.008448481559753418, 0.00879359245300293, 0.009138703346252441, 0.009483814239501953, 0.009828925132751465, 0.010174036026000977, 0.010519146919250488, 0.0108642578125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 2.0, 8.0, 7.0, 20.0, 28.0, 47.0, 87.0, 164.0, 547.0, 1425.0, 991.0, 324.0, 125.0, 80.0, 63.0, 42.0, 36.0, 20.0, 11.0, 8.0, 6.0, 8.0, 5.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0121002197265625, -0.011770963668823242, -0.011441707611083984, -0.011112451553344727, -0.010783195495605469, -0.010453939437866211, -0.010124683380126953, -0.009795427322387695, -0.009466171264648438, -0.00913691520690918, -0.008807659149169922, -0.008478403091430664, -0.008149147033691406, -0.007819890975952148, -0.007490634918212891, -0.007161378860473633, -0.006832122802734375, -0.006502866744995117, -0.006173610687255859, -0.0058443546295166016, -0.005515098571777344, -0.005185842514038086, -0.004856586456298828, -0.00452733039855957, -0.0041980743408203125, -0.0038688182830810547, -0.003539562225341797, -0.003210306167602539, -0.0028810501098632812, -0.0025517940521240234, -0.0022225379943847656, -0.0018932819366455078, -0.00156402587890625, -0.0012347698211669922, -0.0009055137634277344, -0.0005762577056884766, -0.00024700164794921875, 8.225440979003906e-05, 0.0004115104675292969, 0.0007407665252685547, 0.0010700225830078125, 0.0013992786407470703, 0.0017285346984863281, 0.002057790756225586, 0.0023870468139648438, 0.0027163028717041016, 0.0030455589294433594, 0.003374814987182617, 0.003704071044921875, 0.004033327102661133, 0.004362583160400391, 0.0046918392181396484, 0.005021095275878906, 0.005350351333618164, 0.005679607391357422, 0.00600886344909668, 0.0063381195068359375, 0.006667375564575195, 0.006996631622314453, 0.007325887680053711, 0.007655143737792969, 0.007984399795532227, 0.008313655853271484, 0.008642911911010742, 0.00897216796875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 12.0, 103.0, 369.0, 380.0, 107.0, 27.0, 8.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13586591184139252, -0.13217034935951233, -0.12847478687763214, -0.12477922439575195, -0.12108366191387177, -0.11738809943199158, -0.11369254440069199, -0.1099969819188118, -0.10630141943693161, -0.10260585695505142, -0.09891029447317123, -0.09521473199129105, -0.09151917695999146, -0.08782361447811127, -0.08412805199623108, -0.08043248951435089, -0.0767369270324707, -0.07304136455059052, -0.06934580206871033, -0.06565023958683014, -0.06195468083024025, -0.05825911834836006, -0.05456355959177017, -0.050867997109889984, -0.047172434628009796, -0.04347687214612961, -0.03978130966424942, -0.03608575090765953, -0.03239018842577934, -0.028694625943899155, -0.024999065324664116, -0.021303504705429077, -0.01760794222354889, -0.013912380672991276, -0.010216819122433662, -0.006521257571876049, -0.0028256960213184357, 0.0008698664605617523, 0.004565427079796791, 0.00826098769903183, 0.011956550180912018, 0.015652112662792206, 0.019347673282027245, 0.023043233901262283, 0.02673879638314247, 0.03043435886502266, 0.03412991762161255, 0.03782548010349274, 0.041521042585372925, 0.04521660506725311, 0.0489121675491333, 0.05260772630572319, 0.05630328878760338, 0.059998851269483566, 0.06369441002607346, 0.06738997250795364, 0.07108553498983383, 0.07478109747171402, 0.07847665995359421, 0.0821722224354744, 0.08586777746677399, 0.08956333994865417, 0.09325890243053436, 0.09695446491241455, 0.10065002739429474]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 6.0, 11.0, 10.0, 10.0, 10.0, 13.0, 18.0, 15.0, 20.0, 24.0, 27.0, 30.0, 40.0, 42.0, 35.0, 46.0, 47.0, 37.0, 51.0, 48.0, 47.0, 48.0, 38.0, 42.0, 30.0, 29.0, 35.0, 23.0, 28.0, 22.0, 16.0, 15.0, 16.0, 12.0, 14.0, 10.0, 10.0, 13.0, 2.0, 1.0, 4.0, 7.0, 3.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021767079830169678, -0.021027568727731705, -0.02028805762529373, -0.01954854652285576, -0.018809035420417786, -0.018069524317979813, -0.01733001321554184, -0.016590502113103867, -0.015850991010665894, -0.01511147990822792, -0.014371968805789948, -0.013632457703351974, -0.012892946600914001, -0.012153435498476028, -0.011413924396038055, -0.010674413293600082, -0.00993490219116211, -0.009195391088724136, -0.008455879986286163, -0.00771636888384819, -0.006976857781410217, -0.006237346678972244, -0.005497835576534271, -0.004758324474096298, -0.004018813371658325, -0.003279302269220352, -0.002539791166782379, -0.0018002800643444061, -0.001060768961906433, -0.0003212578594684601, 0.00041825324296951294, 0.001157764345407486, 0.001897275447845459, 0.002636786550283432, 0.003376297652721405, 0.004115808755159378, 0.004855319857597351, 0.005594830960035324, 0.006334342062473297, 0.00707385316491127, 0.007813364267349243, 0.008552875369787216, 0.00929238647222519, 0.010031897574663162, 0.010771408677101135, 0.011510919779539108, 0.012250430881977081, 0.012989941984415054, 0.013729453086853027, 0.014468964189291, 0.015208475291728973, 0.015947986394166946, 0.01668749749660492, 0.017427008599042892, 0.018166519701480865, 0.01890603080391884, 0.01964554190635681, 0.020385053008794785, 0.021124564111232758, 0.02186407521367073, 0.022603586316108704, 0.023343097418546677, 0.02408260852098465, 0.024822119623422623, 0.025561630725860596]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 15.0, 11.0, 26.0, 40.0, 40.0, 63.0, 98.0, 123.0, 161.0, 195.0, 331.0, 454.0, 797.0, 1613.0, 5223.0, 44350.0, 818456.0, 161439.0, 9970.0, 2325.0, 954.0, 585.0, 365.0, 270.0, 182.0, 131.0, 85.0, 80.0, 48.0, 28.0, 28.0, 20.0, 12.0, 6.0, 6.0, 9.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0274200439453125, -0.026581287384033203, -0.025742530822753906, -0.02490377426147461, -0.024065017700195312, -0.023226261138916016, -0.02238750457763672, -0.021548748016357422, -0.020709991455078125, -0.019871234893798828, -0.01903247833251953, -0.018193721771240234, -0.017354965209960938, -0.01651620864868164, -0.015677452087402344, -0.014838695526123047, -0.01399993896484375, -0.013161182403564453, -0.012322425842285156, -0.01148366928100586, -0.010644912719726562, -0.009806156158447266, -0.008967399597167969, -0.008128643035888672, -0.007289886474609375, -0.006451129913330078, -0.005612373352050781, -0.004773616790771484, -0.0039348602294921875, -0.0030961036682128906, -0.0022573471069335938, -0.0014185905456542969, -0.000579833984375, 0.0002589225769042969, 0.0010976791381835938, 0.0019364356994628906, 0.0027751922607421875, 0.0036139488220214844, 0.004452705383300781, 0.005291461944580078, 0.006130218505859375, 0.006968975067138672, 0.007807731628417969, 0.008646488189697266, 0.009485244750976562, 0.01032400131225586, 0.011162757873535156, 0.012001514434814453, 0.01284027099609375, 0.013679027557373047, 0.014517784118652344, 0.01535654067993164, 0.016195297241210938, 0.017034053802490234, 0.01787281036376953, 0.018711566925048828, 0.019550323486328125, 0.020389080047607422, 0.02122783660888672, 0.022066593170166016, 0.022905349731445312, 0.02374410629272461, 0.024582862854003906, 0.025421619415283203, 0.0262603759765625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 7.0, 31.0, 87.0, 159.0, 215.0, 223.0, 166.0, 73.0, 25.0, 13.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.021270751953125, -0.020583629608154297, -0.019896507263183594, -0.01920938491821289, -0.018522262573242188, -0.017835140228271484, -0.01714801788330078, -0.016460895538330078, -0.015773773193359375, -0.015086650848388672, -0.014399528503417969, -0.013712406158447266, -0.013025283813476562, -0.01233816146850586, -0.011651039123535156, -0.010963916778564453, -0.01027679443359375, -0.009589672088623047, -0.008902549743652344, -0.00821542739868164, -0.0075283050537109375, -0.006841182708740234, -0.006154060363769531, -0.005466938018798828, -0.004779815673828125, -0.004092693328857422, -0.0034055709838867188, -0.0027184486389160156, -0.0020313262939453125, -0.0013442039489746094, -0.0006570816040039062, 3.0040740966796875e-05, 0.0007171630859375, 0.0014042854309082031, 0.0020914077758789062, 0.0027785301208496094, 0.0034656524658203125, 0.004152774810791016, 0.004839897155761719, 0.005527019500732422, 0.006214141845703125, 0.006901264190673828, 0.007588386535644531, 0.008275508880615234, 0.008962631225585938, 0.00964975357055664, 0.010336875915527344, 0.011023998260498047, 0.01171112060546875, 0.012398242950439453, 0.013085365295410156, 0.01377248764038086, 0.014459609985351562, 0.015146732330322266, 0.01583385467529297, 0.016520977020263672, 0.017208099365234375, 0.017895221710205078, 0.01858234405517578, 0.019269466400146484, 0.019956588745117188, 0.02064371109008789, 0.021330833435058594, 0.022017955780029297, 0.022705078125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 7.0, 7.0, 5.0, 15.0, 20.0, 25.0, 52.0, 59.0, 97.0, 149.0, 235.0, 420.0, 678.0, 1394.0, 2722.0, 6078.0, 14114.0, 42606.0, 172000.0, 495871.0, 227357.0, 53795.0, 17143.0, 6846.0, 3271.0, 1606.0, 809.0, 434.0, 286.0, 139.0, 105.0, 73.0, 34.0, 23.0, 16.0, 13.0, 13.0, 6.0, 7.0, 7.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0104827880859375, -0.010161161422729492, -0.009839534759521484, -0.009517908096313477, -0.009196281433105469, -0.008874654769897461, -0.008553028106689453, -0.008231401443481445, -0.007909774780273438, -0.00758814811706543, -0.007266521453857422, -0.006944894790649414, -0.006623268127441406, -0.0063016414642333984, -0.005980014801025391, -0.005658388137817383, -0.005336761474609375, -0.005015134811401367, -0.004693508148193359, -0.0043718814849853516, -0.004050254821777344, -0.003728628158569336, -0.003407001495361328, -0.0030853748321533203, -0.0027637481689453125, -0.0024421215057373047, -0.002120494842529297, -0.001798868179321289, -0.0014772415161132812, -0.0011556148529052734, -0.0008339881896972656, -0.0005123615264892578, -0.00019073486328125, 0.0001308917999267578, 0.0004525184631347656, 0.0007741451263427734, 0.0010957717895507812, 0.001417398452758789, 0.0017390251159667969, 0.0020606517791748047, 0.0023822784423828125, 0.0027039051055908203, 0.003025531768798828, 0.003347158432006836, 0.0036687850952148438, 0.0039904117584228516, 0.004312038421630859, 0.004633665084838867, 0.004955291748046875, 0.005276918411254883, 0.005598545074462891, 0.0059201717376708984, 0.006241798400878906, 0.006563425064086914, 0.006885051727294922, 0.00720667839050293, 0.0075283050537109375, 0.007849931716918945, 0.008171558380126953, 0.008493185043334961, 0.008814811706542969, 0.009136438369750977, 0.009458065032958984, 0.009779691696166992, 0.010101318359375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 3.0, 4.0, 7.0, 11.0, 16.0, 15.0, 13.0, 13.0, 19.0, 32.0, 24.0, 34.0, 37.0, 57.0, 47.0, 55.0, 59.0, 62.0, 51.0, 50.0, 50.0, 34.0, 51.0, 41.0, 36.0, 25.0, 32.0, 28.0, 15.0, 19.0, 8.0, 7.0, 11.0, 10.0, 6.0, 5.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0156707763671875, -0.015208601951599121, -0.014746427536010742, -0.014284253120422363, -0.013822078704833984, -0.013359904289245605, -0.012897729873657227, -0.012435555458068848, -0.011973381042480469, -0.01151120662689209, -0.011049032211303711, -0.010586857795715332, -0.010124683380126953, -0.009662508964538574, -0.009200334548950195, -0.008738160133361816, -0.008275985717773438, -0.007813811302185059, -0.00735163688659668, -0.006889462471008301, -0.006427288055419922, -0.005965113639831543, -0.005502939224243164, -0.005040764808654785, -0.004578590393066406, -0.004116415977478027, -0.0036542415618896484, -0.0031920671463012695, -0.0027298927307128906, -0.0022677183151245117, -0.0018055438995361328, -0.001343369483947754, -0.000881195068359375, -0.0004190206527709961, 4.315376281738281e-05, 0.0005053281784057617, 0.0009675025939941406, 0.0014296770095825195, 0.0018918514251708984, 0.0023540258407592773, 0.0028162002563476562, 0.003278374671936035, 0.003740549087524414, 0.004202723503112793, 0.004664897918701172, 0.005127072334289551, 0.00558924674987793, 0.006051421165466309, 0.0065135955810546875, 0.006975769996643066, 0.007437944412231445, 0.007900118827819824, 0.008362293243408203, 0.008824467658996582, 0.009286642074584961, 0.00974881649017334, 0.010210990905761719, 0.010673165321350098, 0.011135339736938477, 0.011597514152526855, 0.012059688568115234, 0.012521862983703613, 0.012984037399291992, 0.013446211814880371, 0.01390838623046875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 2.0, 4.0, 4.0, 6.0, 11.0, 8.0, 22.0, 23.0, 32.0, 55.0, 62.0, 161.0, 213.0, 387.0, 646.0, 1274.0, 2394.0, 4585.0, 10083.0, 31761.0, 267382.0, 643935.0, 58421.0, 14586.0, 5963.0, 2935.0, 1563.0, 797.0, 521.0, 282.0, 158.0, 91.0, 60.0, 40.0, 31.0, 19.0, 13.0, 7.0, 7.0, 4.0, 2.0, 1.0, 2.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00710296630859375, -0.0068416595458984375, -0.006580352783203125, -0.0063190460205078125, -0.0060577392578125, -0.0057964324951171875, -0.005535125732421875, -0.0052738189697265625, -0.00501251220703125, -0.0047512054443359375, -0.004489898681640625, -0.0042285919189453125, -0.00396728515625, -0.0037059783935546875, -0.003444671630859375, -0.0031833648681640625, -0.00292205810546875, -0.0026607513427734375, -0.002399444580078125, -0.0021381378173828125, -0.0018768310546875, -0.0016155242919921875, -0.001354217529296875, -0.0010929107666015625, -0.00083160400390625, -0.0005702972412109375, -0.000308990478515625, -4.76837158203125e-05, 0.000213623046875, 0.0004749298095703125, 0.000736236572265625, 0.0009975433349609375, 0.00125885009765625, 0.0015201568603515625, 0.001781463623046875, 0.0020427703857421875, 0.0023040771484375, 0.0025653839111328125, 0.002826690673828125, 0.0030879974365234375, 0.00334930419921875, 0.0036106109619140625, 0.003871917724609375, 0.0041332244873046875, 0.00439453125, 0.0046558380126953125, 0.004917144775390625, 0.0051784515380859375, 0.00543975830078125, 0.0057010650634765625, 0.005962371826171875, 0.0062236785888671875, 0.0064849853515625, 0.0067462921142578125, 0.007007598876953125, 0.0072689056396484375, 0.00753021240234375, 0.0077915191650390625, 0.008052825927734375, 0.008314132690429688, 0.008575439453125, 0.008836746215820312, 0.009098052978515625, 0.009359359741210938, 0.00962066650390625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 1.0, 10.0, 4.0, 10.0, 18.0, 16.0, 19.0, 35.0, 43.0, 40.0, 58.0, 78.0, 97.0, 103.0, 92.0, 66.0, 71.0, 55.0, 42.0, 30.0, 27.0, 25.0, 11.0, 15.0, 10.0, 10.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.232759475708008e-05, -8.88453796505928e-05, -8.536316454410553e-05, -8.188094943761826e-05, -7.839873433113098e-05, -7.491651922464371e-05, -7.143430411815643e-05, -6.795208901166916e-05, -6.446987390518188e-05, -6.098765879869461e-05, -5.7505443692207336e-05, -5.402322858572006e-05, -5.054101347923279e-05, -4.7058798372745514e-05, -4.357658326625824e-05, -4.0094368159770966e-05, -3.661215305328369e-05, -3.312993794679642e-05, -2.9647722840309143e-05, -2.616550773382187e-05, -2.2683292627334595e-05, -1.920107752084732e-05, -1.5718862414360046e-05, -1.2236647307872772e-05, -8.754432201385498e-06, -5.272217094898224e-06, -1.7900019884109497e-06, 1.6922131180763245e-06, 5.174428224563599e-06, 8.656643331050873e-06, 1.2138858437538147e-05, 1.562107354402542e-05, 1.9103288650512695e-05, 2.258550375699997e-05, 2.6067718863487244e-05, 2.9549933969974518e-05, 3.303214907646179e-05, 3.6514364182949066e-05, 3.999657928943634e-05, 4.3478794395923615e-05, 4.696100950241089e-05, 5.044322460889816e-05, 5.392543971538544e-05, 5.740765482187271e-05, 6.0889869928359985e-05, 6.437208503484726e-05, 6.785430014133453e-05, 7.133651524782181e-05, 7.481873035430908e-05, 7.830094546079636e-05, 8.178316056728363e-05, 8.52653756737709e-05, 8.874759078025818e-05, 9.222980588674545e-05, 9.571202099323273e-05, 9.919423609972e-05, 0.00010267645120620728, 0.00010615866631269455, 0.00010964088141918182, 0.0001131230965256691, 0.00011660531163215637, 0.00012008752673864365, 0.00012356974184513092, 0.0001270519569516182, 0.00013053417205810547]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 6.0, 13.0, 14.0, 26.0, 44.0, 55.0, 90.0, 165.0, 276.0, 397.0, 763.0, 1505.0, 3187.0, 8295.0, 33752.0, 564664.0, 393983.0, 27728.0, 7478.0, 2977.0, 1350.0, 687.0, 411.0, 255.0, 161.0, 103.0, 64.0, 38.0, 23.0, 11.0, 8.0, 9.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0092926025390625, -0.008971571922302246, -0.008650541305541992, -0.008329510688781738, -0.008008480072021484, -0.0076874494552612305, -0.0073664188385009766, -0.007045388221740723, -0.006724357604980469, -0.006403326988220215, -0.006082296371459961, -0.005761265754699707, -0.005440235137939453, -0.005119204521179199, -0.004798173904418945, -0.004477143287658691, -0.0041561126708984375, -0.0038350820541381836, -0.0035140514373779297, -0.0031930208206176758, -0.002871990203857422, -0.002550959587097168, -0.002229928970336914, -0.0019088983535766602, -0.0015878677368164062, -0.0012668371200561523, -0.0009458065032958984, -0.0006247758865356445, -0.0003037452697753906, 1.728534698486328e-05, 0.0003383159637451172, 0.0006593465805053711, 0.000980377197265625, 0.001301407814025879, 0.0016224384307861328, 0.0019434690475463867, 0.0022644996643066406, 0.0025855302810668945, 0.0029065608978271484, 0.0032275915145874023, 0.0035486221313476562, 0.00386965274810791, 0.004190683364868164, 0.004511713981628418, 0.004832744598388672, 0.005153775215148926, 0.00547480583190918, 0.005795836448669434, 0.0061168670654296875, 0.006437897682189941, 0.006758928298950195, 0.007079958915710449, 0.007400989532470703, 0.007722020149230957, 0.008043050765991211, 0.008364081382751465, 0.008685111999511719, 0.009006142616271973, 0.009327173233032227, 0.00964820384979248, 0.009969234466552734, 0.010290265083312988, 0.010611295700073242, 0.010932326316833496, 0.01125335693359375]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 5.0, 4.0, 11.0, 5.0, 3.0, 14.0, 23.0, 38.0, 88.0, 177.0, 305.0, 143.0, 72.0, 41.0, 14.0, 14.0, 9.0, 9.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0105133056640625, -0.010216474533081055, -0.00991964340209961, -0.009622812271118164, -0.009325981140136719, -0.009029150009155273, -0.008732318878173828, -0.008435487747192383, -0.008138656616210938, -0.007841825485229492, -0.007544994354248047, -0.0072481632232666016, -0.006951332092285156, -0.006654500961303711, -0.006357669830322266, -0.00606083869934082, -0.005764007568359375, -0.00546717643737793, -0.005170345306396484, -0.004873514175415039, -0.004576683044433594, -0.0042798519134521484, -0.003983020782470703, -0.003686189651489258, -0.0033893585205078125, -0.003092527389526367, -0.002795696258544922, -0.0024988651275634766, -0.0022020339965820312, -0.001905202865600586, -0.0016083717346191406, -0.0013115406036376953, -0.00101470947265625, -0.0007178783416748047, -0.0004210472106933594, -0.00012421607971191406, 0.00017261505126953125, 0.00046944618225097656, 0.0007662773132324219, 0.0010631084442138672, 0.0013599395751953125, 0.0016567707061767578, 0.001953601837158203, 0.0022504329681396484, 0.0025472640991210938, 0.002844095230102539, 0.0031409263610839844, 0.0034377574920654297, 0.003734588623046875, 0.00403141975402832, 0.004328250885009766, 0.004625082015991211, 0.004921913146972656, 0.0052187442779541016, 0.005515575408935547, 0.005812406539916992, 0.0061092376708984375, 0.006406068801879883, 0.006702899932861328, 0.0069997310638427734, 0.007296562194824219, 0.007593393325805664, 0.00789022445678711, 0.008187055587768555, 0.00848388671875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 25.0, 111.0, 525.0, 288.0, 52.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07419072836637497, -0.06646933406591415, -0.05874794349074364, -0.05102655291557312, -0.043305158615112305, -0.03558376803994179, -0.02786237746477127, -0.020140983164310455, -0.012419592589139938, -0.0046982006169855595, 0.0030231913551688194, 0.010744582861661911, 0.018465975299477577, 0.026187367737293243, 0.03390875831246376, 0.041630152612924576, 0.04935154318809509, 0.05707293376326561, 0.06479432433843613, 0.07251571863889694, 0.08023711293935776, 0.08795849978923798, 0.09567989408969879, 0.1034012883901596, 0.11112268269062042, 0.11884407699108124, 0.12656547129154205, 0.13428685069084167, 0.1420082449913025, 0.1497296392917633, 0.15745103359222412, 0.16517242789268494, 0.17289380729198456, 0.18061520159244537, 0.1883365958929062, 0.1960579752922058, 0.20377936959266663, 0.21150076389312744, 0.21922215819358826, 0.22694355249404907, 0.2346649467945099, 0.2423863410949707, 0.2501077353954315, 0.25782912969589233, 0.26555052399635315, 0.27327191829681396, 0.2809932827949524, 0.2887147068977356, 0.296436071395874, 0.30415746569633484, 0.31187885999679565, 0.31960025429725647, 0.3273216485977173, 0.3350430428981781, 0.3427644371986389, 0.35048580169677734, 0.35820722579956055, 0.36592862010002136, 0.3736500144004822, 0.381371408700943, 0.3890928030014038, 0.3968141973018646, 0.40453559160232544, 0.41225695610046387, 0.4199783504009247]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 0.0, 3.0, 6.0, 10.0, 3.0, 16.0, 11.0, 23.0, 15.0, 19.0, 37.0, 35.0, 40.0, 35.0, 45.0, 45.0, 66.0, 47.0, 60.0, 52.0, 59.0, 60.0, 61.0, 48.0, 41.0, 36.0, 27.0, 23.0, 25.0, 16.0, 12.0, 13.0, 12.0, 6.0, 4.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0664941668510437, -0.06496723741292953, -0.06344031542539597, -0.0619133859872818, -0.06038646027445793, -0.058859534561634064, -0.0573326051235199, -0.05580567941069603, -0.05427875369787216, -0.052751827985048294, -0.051224902272224426, -0.04969797283411026, -0.04817104712128639, -0.046644121408462524, -0.04511719197034836, -0.04359026625752449, -0.04206334054470062, -0.040536414831876755, -0.03900948911905289, -0.03748255968093872, -0.03595563396811485, -0.034428708255290985, -0.03290177881717682, -0.03137485310435295, -0.029847927391529083, -0.028321001678705215, -0.0267940741032362, -0.02526714652776718, -0.023740220814943314, -0.022213295102119446, -0.02068636752665043, -0.019159439951181412, -0.017632514238357544, -0.016105588525533676, -0.014578660950064659, -0.013051734305918217, -0.011524807661771774, -0.009997881017625332, -0.00847095437347889, -0.006944027729332447, -0.005417101085186005, -0.0038901744410395622, -0.00236324779689312, -0.0008363211527466774, 0.000690605491399765, 0.0022175321355462074, 0.00374445877969265, 0.005271385423839092, 0.006798312067985535, 0.008325238712131977, 0.00985216535627842, 0.011379092000424862, 0.012906018644571304, 0.014432945288717747, 0.01595987193286419, 0.017486799508333206, 0.019013725221157074, 0.020540650933980942, 0.02206757850944996, 0.023594506084918976, 0.025121431797742844, 0.02664835751056671, 0.02817528508603573, 0.029702212661504745, 0.031229138374328613]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 10.0, 14.0, 25.0, 36.0, 53.0, 125.0, 215.0, 527.0, 1987.0, 9753.0, 3838778.0, 335227.0, 5724.0, 1130.0, 337.0, 147.0, 75.0, 48.0, 28.0, 18.0, 17.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.038909912109375, -0.03751373291015625, -0.0361175537109375, -0.03472137451171875, -0.0333251953125, -0.03192901611328125, -0.0305328369140625, -0.02913665771484375, -0.027740478515625, -0.02634429931640625, -0.0249481201171875, -0.02355194091796875, -0.02215576171875, -0.02075958251953125, -0.0193634033203125, -0.01796722412109375, -0.016571044921875, -0.01517486572265625, -0.0137786865234375, -0.01238250732421875, -0.010986328125, -0.00959014892578125, -0.0081939697265625, -0.00679779052734375, -0.005401611328125, -0.00400543212890625, -0.0026092529296875, -0.00121307373046875, 0.00018310546875, 0.00157928466796875, 0.0029754638671875, 0.00437164306640625, 0.005767822265625, 0.00716400146484375, 0.0085601806640625, 0.00995635986328125, 0.0113525390625, 0.01274871826171875, 0.0141448974609375, 0.01554107666015625, 0.016937255859375, 0.01833343505859375, 0.0197296142578125, 0.02112579345703125, 0.02252197265625, 0.02391815185546875, 0.0253143310546875, 0.02671051025390625, 0.028106689453125, 0.02950286865234375, 0.0308990478515625, 0.03229522705078125, 0.03369140625, 0.03508758544921875, 0.0364837646484375, 0.03787994384765625, 0.039276123046875, 0.04067230224609375, 0.0420684814453125, 0.04346466064453125, 0.04486083984375, 0.04625701904296875, 0.0476531982421875, 0.04904937744140625, 0.050445556640625]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 9.0, 41.0, 74.0, 163.0, 210.0, 243.0, 149.0, 74.0, 20.0, 13.0, 7.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0213775634765625, -0.020686864852905273, -0.019996166229248047, -0.01930546760559082, -0.018614768981933594, -0.017924070358276367, -0.01723337173461914, -0.016542673110961914, -0.015851974487304688, -0.015161275863647461, -0.014470577239990234, -0.013779878616333008, -0.013089179992675781, -0.012398481369018555, -0.011707782745361328, -0.011017084121704102, -0.010326385498046875, -0.009635686874389648, -0.008944988250732422, -0.008254289627075195, -0.007563591003417969, -0.006872892379760742, -0.006182193756103516, -0.005491495132446289, -0.0048007965087890625, -0.004110097885131836, -0.0034193992614746094, -0.002728700637817383, -0.0020380020141601562, -0.0013473033905029297, -0.0006566047668457031, 3.409385681152344e-05, 0.00072479248046875, 0.0014154911041259766, 0.002106189727783203, 0.0027968883514404297, 0.0034875869750976562, 0.004178285598754883, 0.004868984222412109, 0.005559682846069336, 0.0062503814697265625, 0.006941080093383789, 0.007631778717041016, 0.008322477340698242, 0.009013175964355469, 0.009703874588012695, 0.010394573211669922, 0.011085271835327148, 0.011775970458984375, 0.012466669082641602, 0.013157367706298828, 0.013848066329956055, 0.014538764953613281, 0.015229463577270508, 0.015920162200927734, 0.01661086082458496, 0.017301559448242188, 0.017992258071899414, 0.01868295669555664, 0.019373655319213867, 0.020064353942871094, 0.02075505256652832, 0.021445751190185547, 0.022136449813842773, 0.0228271484375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 7.0, 8.0, 8.0, 9.0, 11.0, 18.0, 21.0, 22.0, 37.0, 64.0, 74.0, 106.0, 179.0, 274.0, 512.0, 990.0, 2571.0, 8595.0, 50704.0, 3526844.0, 566906.0, 26932.0, 5580.0, 1860.0, 816.0, 441.0, 215.0, 140.0, 90.0, 56.0, 50.0, 48.0, 24.0, 14.0, 13.0, 10.0, 5.0, 8.0, 7.0, 3.0, 5.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.0223236083984375, -0.02170085906982422, -0.021078109741210938, -0.020455360412597656, -0.019832611083984375, -0.019209861755371094, -0.018587112426757812, -0.01796436309814453, -0.01734161376953125, -0.01671886444091797, -0.016096115112304688, -0.015473365783691406, -0.014850616455078125, -0.014227867126464844, -0.013605117797851562, -0.012982368469238281, -0.012359619140625, -0.011736869812011719, -0.011114120483398438, -0.010491371154785156, -0.009868621826171875, -0.009245872497558594, -0.008623123168945312, -0.008000373840332031, -0.00737762451171875, -0.006754875183105469, -0.0061321258544921875, -0.005509376525878906, -0.004886627197265625, -0.004263877868652344, -0.0036411285400390625, -0.0030183792114257812, -0.0023956298828125, -0.0017728805541992188, -0.0011501312255859375, -0.0005273818969726562, 9.5367431640625e-05, 0.0007181167602539062, 0.0013408660888671875, 0.0019636154174804688, 0.00258636474609375, 0.0032091140747070312, 0.0038318634033203125, 0.004454612731933594, 0.005077362060546875, 0.005700111389160156, 0.0063228607177734375, 0.006945610046386719, 0.007568359375, 0.008191108703613281, 0.008813858032226562, 0.009436607360839844, 0.010059356689453125, 0.010682106018066406, 0.011304855346679688, 0.011927604675292969, 0.01255035400390625, 0.013173103332519531, 0.013795852661132812, 0.014418601989746094, 0.015041351318359375, 0.015664100646972656, 0.016286849975585938, 0.01690959930419922, 0.0175323486328125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 6.0, 3.0, 6.0, 12.0, 25.0, 60.0, 192.0, 1130.0, 2154.0, 303.0, 99.0, 36.0, 25.0, 14.0, 11.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.030609130859375, -0.029846906661987305, -0.02908468246459961, -0.028322458267211914, -0.02756023406982422, -0.026798009872436523, -0.026035785675048828, -0.025273561477661133, -0.024511337280273438, -0.023749113082885742, -0.022986888885498047, -0.02222466468811035, -0.021462440490722656, -0.02070021629333496, -0.019937992095947266, -0.01917576789855957, -0.018413543701171875, -0.01765131950378418, -0.016889095306396484, -0.01612687110900879, -0.015364646911621094, -0.014602422714233398, -0.013840198516845703, -0.013077974319458008, -0.012315750122070312, -0.011553525924682617, -0.010791301727294922, -0.010029077529907227, -0.009266853332519531, -0.008504629135131836, -0.007742404937744141, -0.006980180740356445, -0.00621795654296875, -0.005455732345581055, -0.004693508148193359, -0.003931283950805664, -0.0031690597534179688, -0.0024068355560302734, -0.0016446113586425781, -0.0008823871612548828, -0.0001201629638671875, 0.0006420612335205078, 0.0014042854309082031, 0.0021665096282958984, 0.0029287338256835938, 0.003690958023071289, 0.004453182220458984, 0.00521540641784668, 0.005977630615234375, 0.00673985481262207, 0.007502079010009766, 0.008264303207397461, 0.009026527404785156, 0.009788751602172852, 0.010550975799560547, 0.011313199996948242, 0.012075424194335938, 0.012837648391723633, 0.013599872589111328, 0.014362096786499023, 0.015124320983886719, 0.015886545181274414, 0.01664876937866211, 0.017410993576049805, 0.0181732177734375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 7.0, 33.0, 93.0, 240.0, 354.0, 191.0, 53.0, 24.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.15923556685447693, -0.15571248531341553, -0.15218941867351532, -0.14866633713245392, -0.1451432704925537, -0.1416201889514923, -0.1380971223115921, -0.1345740407705307, -0.1310509741306305, -0.1275278925895691, -0.12400482594966888, -0.12048175185918808, -0.11695867776870728, -0.11343559622764587, -0.10991252213716507, -0.10638944804668427, -0.10286636650562286, -0.09934329241514206, -0.09582021832466125, -0.09229714423418045, -0.08877407014369965, -0.08525098860263824, -0.08172791451215744, -0.07820484042167664, -0.07468176633119583, -0.07115869224071503, -0.06763561815023422, -0.06411254405975342, -0.060589466243982315, -0.05706639215350151, -0.05354331433773041, -0.0500202402472496, -0.0464971587061882, -0.0429740846157074, -0.03945101052522659, -0.03592793270945549, -0.032404858618974686, -0.02888178452849388, -0.025358708575367928, -0.021835632622241974, -0.01831255853176117, -0.01478948350995779, -0.011266408488154411, -0.007743333466351032, -0.004220258444547653, -0.0006971843540668488, 0.002825891599059105, 0.006348967552185059, 0.009872041642665863, 0.013395116664469242, 0.01691819168627262, 0.020441267639398575, 0.02396434172987938, 0.027487415820360184, 0.031010491773486137, 0.03453356772661209, 0.038056641817092896, 0.0415797159075737, 0.045102789998054504, 0.04862586781382561, 0.05214894190430641, 0.055672015994787216, 0.05919509381055832, 0.06271816790103912, 0.06624124199151993]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 2.0, 4.0, 8.0, 11.0, 10.0, 10.0, 10.0, 16.0, 21.0, 20.0, 32.0, 34.0, 34.0, 38.0, 49.0, 54.0, 55.0, 50.0, 51.0, 52.0, 61.0, 46.0, 33.0, 43.0, 46.0, 38.0, 22.0, 26.0, 24.0, 21.0, 19.0, 11.0, 14.0, 6.0, 11.0, 3.0, 2.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.030446171760559082, -0.029427191242575645, -0.02840821072459221, -0.027389230206608772, -0.026370249688625336, -0.0253512691706419, -0.024332288652658463, -0.023313308134675026, -0.02229432761669159, -0.021275347098708153, -0.020256366580724716, -0.01923738606274128, -0.018218405544757843, -0.017199425026774406, -0.01618044450879097, -0.015161463990807533, -0.014142483472824097, -0.01312350295484066, -0.012104522436857224, -0.011085541918873787, -0.01006656140089035, -0.009047580882906914, -0.008028600364923477, -0.007009619846940041, -0.005990639328956604, -0.004971658810973167, -0.003952678292989731, -0.0029336977750062943, -0.0019147172570228577, -0.0008957367390394211, 0.0001232437789440155, 0.001142224296927452, 0.0021612048149108887, 0.0031801853328943253, 0.004199165850877762, 0.005218146368861198, 0.006237126886844635, 0.007256107404828072, 0.008275087922811508, 0.009294068440794945, 0.010313048958778381, 0.011332029476761818, 0.012351009994745255, 0.013369990512728691, 0.014388971030712128, 0.015407951548695564, 0.016426932066679, 0.017445912584662437, 0.018464893102645874, 0.01948387362062931, 0.020502854138612747, 0.021521834656596184, 0.02254081517457962, 0.023559795692563057, 0.024578776210546494, 0.02559775672852993, 0.026616737246513367, 0.027635717764496803, 0.02865469828248024, 0.029673678800463676, 0.030692659318447113, 0.0317116379737854, 0.032730620354413986, 0.03374960273504257, 0.03476858139038086]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 3.0, 7.0, 3.0, 12.0, 10.0, 9.0, 19.0, 21.0, 30.0, 42.0, 61.0, 86.0, 119.0, 191.0, 265.0, 395.0, 634.0, 1226.0, 3076.0, 14872.0, 336185.0, 656943.0, 26592.0, 4144.0, 1468.0, 708.0, 465.0, 293.0, 224.0, 141.0, 71.0, 72.0, 47.0, 39.0, 29.0, 13.0, 13.0, 10.0, 4.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.024261474609375, -0.023366928100585938, -0.022472381591796875, -0.021577835083007812, -0.02068328857421875, -0.019788742065429688, -0.018894195556640625, -0.017999649047851562, -0.0171051025390625, -0.016210556030273438, -0.015316009521484375, -0.014421463012695312, -0.01352691650390625, -0.012632369995117188, -0.011737823486328125, -0.010843276977539062, -0.00994873046875, -0.009054183959960938, -0.008159637451171875, -0.0072650909423828125, -0.00637054443359375, -0.0054759979248046875, -0.004581451416015625, -0.0036869049072265625, -0.0027923583984375, -0.0018978118896484375, -0.001003265380859375, -0.0001087188720703125, 0.00078582763671875, 0.0016803741455078125, 0.002574920654296875, 0.0034694671630859375, 0.004364013671875, 0.0052585601806640625, 0.006153106689453125, 0.0070476531982421875, 0.00794219970703125, 0.008836746215820312, 0.009731292724609375, 0.010625839233398438, 0.0115203857421875, 0.012414932250976562, 0.013309478759765625, 0.014204025268554688, 0.01509857177734375, 0.015993118286132812, 0.016887664794921875, 0.017782211303710938, 0.0186767578125, 0.019571304321289062, 0.020465850830078125, 0.021360397338867188, 0.02225494384765625, 0.023149490356445312, 0.024044036865234375, 0.024938583374023438, 0.0258331298828125, 0.026727676391601562, 0.027622222900390625, 0.028516769409179688, 0.02941131591796875, 0.030305862426757812, 0.031200408935546875, 0.03209495544433594, 0.032989501953125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 8.0, 28.0, 85.0, 170.0, 227.0, 224.0, 149.0, 70.0, 21.0, 16.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02288818359375, -0.022147417068481445, -0.02140665054321289, -0.020665884017944336, -0.01992511749267578, -0.019184350967407227, -0.018443584442138672, -0.017702817916870117, -0.016962051391601562, -0.016221284866333008, -0.015480518341064453, -0.014739751815795898, -0.013998985290527344, -0.013258218765258789, -0.012517452239990234, -0.01177668571472168, -0.011035919189453125, -0.01029515266418457, -0.009554386138916016, -0.008813619613647461, -0.008072853088378906, -0.0073320865631103516, -0.006591320037841797, -0.005850553512573242, -0.0051097869873046875, -0.004369020462036133, -0.003628253936767578, -0.0028874874114990234, -0.0021467208862304688, -0.001405954360961914, -0.0006651878356933594, 7.557868957519531e-05, 0.00081634521484375, 0.0015571117401123047, 0.0022978782653808594, 0.003038644790649414, 0.0037794113159179688, 0.0045201778411865234, 0.005260944366455078, 0.006001710891723633, 0.0067424774169921875, 0.007483243942260742, 0.008224010467529297, 0.008964776992797852, 0.009705543518066406, 0.010446310043334961, 0.011187076568603516, 0.01192784309387207, 0.012668609619140625, 0.01340937614440918, 0.014150142669677734, 0.014890909194946289, 0.015631675720214844, 0.0163724422454834, 0.017113208770751953, 0.017853975296020508, 0.018594741821289062, 0.019335508346557617, 0.020076274871826172, 0.020817041397094727, 0.02155780792236328, 0.022298574447631836, 0.02303934097290039, 0.023780107498168945, 0.0245208740234375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 5.0, 2.0, 5.0, 3.0, 5.0, 7.0, 5.0, 15.0, 24.0, 20.0, 31.0, 49.0, 62.0, 121.0, 201.0, 383.0, 742.0, 1494.0, 3302.0, 7800.0, 21052.0, 66192.0, 238427.0, 448168.0, 180973.0, 50781.0, 16766.0, 6365.0, 2882.0, 1229.0, 621.0, 315.0, 189.0, 95.0, 58.0, 43.0, 28.0, 22.0, 20.0, 16.0, 12.0, 13.0, 9.0, 5.0, 3.0, 1.0, 4.0, 0.0, 2.0, 2.0], "bins": [-0.01198577880859375, -0.0116652250289917, -0.011344671249389648, -0.011024117469787598, -0.010703563690185547, -0.010383009910583496, -0.010062456130981445, -0.009741902351379395, -0.009421348571777344, -0.009100794792175293, -0.008780241012573242, -0.008459687232971191, -0.00813913345336914, -0.00781857967376709, -0.007498025894165039, -0.007177472114562988, -0.0068569183349609375, -0.006536364555358887, -0.006215810775756836, -0.005895256996154785, -0.005574703216552734, -0.005254149436950684, -0.004933595657348633, -0.004613041877746582, -0.004292488098144531, -0.0039719343185424805, -0.0036513805389404297, -0.003330826759338379, -0.003010272979736328, -0.0026897192001342773, -0.0023691654205322266, -0.0020486116409301758, -0.001728057861328125, -0.0014075040817260742, -0.0010869503021240234, -0.0007663965225219727, -0.0004458427429199219, -0.0001252889633178711, 0.0001952648162841797, 0.0005158185958862305, 0.0008363723754882812, 0.001156926155090332, 0.0014774799346923828, 0.0017980337142944336, 0.0021185874938964844, 0.002439141273498535, 0.002759695053100586, 0.0030802488327026367, 0.0034008026123046875, 0.0037213563919067383, 0.004041910171508789, 0.00436246395111084, 0.004683017730712891, 0.005003571510314941, 0.005324125289916992, 0.005644679069519043, 0.005965232849121094, 0.0062857866287231445, 0.006606340408325195, 0.006926894187927246, 0.007247447967529297, 0.007568001747131348, 0.007888555526733398, 0.00820910930633545, 0.0085296630859375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 6.0, 8.0, 10.0, 9.0, 12.0, 10.0, 13.0, 22.0, 27.0, 25.0, 24.0, 18.0, 25.0, 40.0, 51.0, 38.0, 52.0, 53.0, 54.0, 52.0, 36.0, 41.0, 49.0, 44.0, 31.0, 28.0, 38.0, 25.0, 25.0, 24.0, 25.0, 17.0, 18.0, 12.0, 8.0, 9.0, 4.0, 5.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01180267333984375, -0.011354565620422363, -0.010906457901000977, -0.01045835018157959, -0.010010242462158203, -0.009562134742736816, -0.00911402702331543, -0.008665919303894043, -0.008217811584472656, -0.0077697038650512695, -0.007321596145629883, -0.006873488426208496, -0.006425380706787109, -0.005977272987365723, -0.005529165267944336, -0.005081057548522949, -0.0046329498291015625, -0.004184842109680176, -0.003736734390258789, -0.0032886266708374023, -0.0028405189514160156, -0.002392411231994629, -0.0019443035125732422, -0.0014961957931518555, -0.0010480880737304688, -0.000599980354309082, -0.0001518726348876953, 0.0002962350845336914, 0.0007443428039550781, 0.0011924505233764648, 0.0016405582427978516, 0.0020886659622192383, 0.002536773681640625, 0.0029848814010620117, 0.0034329891204833984, 0.003881096839904785, 0.004329204559326172, 0.004777312278747559, 0.005225419998168945, 0.005673527717590332, 0.006121635437011719, 0.0065697431564331055, 0.007017850875854492, 0.007465958595275879, 0.007914066314697266, 0.008362174034118652, 0.008810281753540039, 0.009258389472961426, 0.009706497192382812, 0.0101546049118042, 0.010602712631225586, 0.011050820350646973, 0.01149892807006836, 0.011947035789489746, 0.012395143508911133, 0.01284325122833252, 0.013291358947753906, 0.013739466667175293, 0.01418757438659668, 0.014635682106018066, 0.015083789825439453, 0.01553189754486084, 0.015980005264282227, 0.016428112983703613, 0.016876220703125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 4.0, 1.0, 11.0, 10.0, 8.0, 15.0, 28.0, 24.0, 43.0, 78.0, 118.0, 202.0, 378.0, 749.0, 1541.0, 3494.0, 8261.0, 21647.0, 67530.0, 279241.0, 470954.0, 134020.0, 37216.0, 13029.0, 5278.0, 2364.0, 1080.0, 537.0, 264.0, 160.0, 99.0, 44.0, 33.0, 27.0, 11.0, 16.0, 15.0, 7.0, 3.0, 6.0, 1.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0035610198974609375, -0.003439277410507202, -0.003317534923553467, -0.0031957924365997314, -0.003074049949645996, -0.0029523074626922607, -0.0028305649757385254, -0.00270882248878479, -0.0025870800018310547, -0.0024653375148773193, -0.002343595027923584, -0.0022218525409698486, -0.0021001100540161133, -0.001978367567062378, -0.0018566250801086426, -0.0017348825931549072, -0.0016131401062011719, -0.0014913976192474365, -0.0013696551322937012, -0.0012479126453399658, -0.0011261701583862305, -0.0010044276714324951, -0.0008826851844787598, -0.0007609426975250244, -0.0006392002105712891, -0.0005174577236175537, -0.00039571523666381836, -0.000273972749710083, -0.00015223026275634766, -3.0487775802612305e-05, 9.125471115112305e-05, 0.0002129971981048584, 0.00033473968505859375, 0.0004564821720123291, 0.0005782246589660645, 0.0006999671459197998, 0.0008217096328735352, 0.0009434521198272705, 0.0010651946067810059, 0.0011869370937347412, 0.0013086795806884766, 0.001430422067642212, 0.0015521645545959473, 0.0016739070415496826, 0.001795649528503418, 0.0019173920154571533, 0.0020391345024108887, 0.002160876989364624, 0.0022826194763183594, 0.0024043619632720947, 0.00252610445022583, 0.0026478469371795654, 0.0027695894241333008, 0.002891331911087036, 0.0030130743980407715, 0.003134816884994507, 0.003256559371948242, 0.0033783018589019775, 0.003500044345855713, 0.0036217868328094482, 0.0037435293197631836, 0.003865271806716919, 0.003987014293670654, 0.00410875678062439, 0.004230499267578125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 10.0, 11.0, 16.0, 15.0, 10.0, 21.0, 20.0, 16.0, 21.0, 23.0, 43.0, 51.0, 45.0, 66.0, 97.0, 96.0, 74.0, 69.0, 48.0, 26.0, 42.0, 28.0, 25.0, 17.0, 20.0, 11.0, 15.0, 6.0, 7.0, 9.0, 9.0, 3.0, 4.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.744529724121094e-05, -4.574749618768692e-05, -4.40496951341629e-05, -4.2351894080638885e-05, -4.065409302711487e-05, -3.895629197359085e-05, -3.7258490920066833e-05, -3.5560689866542816e-05, -3.38628888130188e-05, -3.216508775949478e-05, -3.0467286705970764e-05, -2.8769485652446747e-05, -2.707168459892273e-05, -2.5373883545398712e-05, -2.3676082491874695e-05, -2.1978281438350677e-05, -2.028048038482666e-05, -1.8582679331302643e-05, -1.6884878277778625e-05, -1.5187077224254608e-05, -1.348927617073059e-05, -1.1791475117206573e-05, -1.0093674063682556e-05, -8.395873010158539e-06, -6.6980719566345215e-06, -5.000270903110504e-06, -3.302469849586487e-06, -1.6046687960624695e-06, 9.313225746154785e-08, 1.7909333109855652e-06, 3.4887343645095825e-06, 5.1865354180336e-06, 6.884336471557617e-06, 8.582137525081635e-06, 1.0279938578605652e-05, 1.197773963212967e-05, 1.3675540685653687e-05, 1.5373341739177704e-05, 1.707114279270172e-05, 1.876894384622574e-05, 2.0466744899749756e-05, 2.2164545953273773e-05, 2.386234700679779e-05, 2.5560148060321808e-05, 2.7257949113845825e-05, 2.8955750167369843e-05, 3.065355122089386e-05, 3.235135227441788e-05, 3.4049153327941895e-05, 3.574695438146591e-05, 3.744475543498993e-05, 3.9142556488513947e-05, 4.0840357542037964e-05, 4.253815859556198e-05, 4.4235959649086e-05, 4.5933760702610016e-05, 4.763156175613403e-05, 4.932936280965805e-05, 5.102716386318207e-05, 5.2724964916706085e-05, 5.44227659702301e-05, 5.612056702375412e-05, 5.781836807727814e-05, 5.9516169130802155e-05, 6.121397018432617e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 7.0, 3.0, 7.0, 6.0, 3.0, 15.0, 11.0, 29.0, 45.0, 87.0, 101.0, 190.0, 394.0, 719.0, 1527.0, 3031.0, 6624.0, 15961.0, 42908.0, 144984.0, 469889.0, 254254.0, 67363.0, 22933.0, 9296.0, 4157.0, 1994.0, 886.0, 466.0, 280.0, 134.0, 97.0, 58.0, 29.0, 25.0, 13.0, 13.0, 12.0, 2.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004207611083984375, -0.004086345434188843, -0.0039650797843933105, -0.0038438141345977783, -0.003722548484802246, -0.003601282835006714, -0.0034800171852111816, -0.0033587515354156494, -0.003237485885620117, -0.003116220235824585, -0.0029949545860290527, -0.0028736889362335205, -0.0027524232864379883, -0.002631157636642456, -0.002509891986846924, -0.0023886263370513916, -0.0022673606872558594, -0.002146095037460327, -0.002024829387664795, -0.0019035637378692627, -0.0017822980880737305, -0.0016610324382781982, -0.001539766788482666, -0.0014185011386871338, -0.0012972354888916016, -0.0011759698390960693, -0.0010547041893005371, -0.0009334385395050049, -0.0008121728897094727, -0.0006909072399139404, -0.0005696415901184082, -0.000448375940322876, -0.00032711029052734375, -0.00020584464073181152, -8.45789909362793e-05, 3.668665885925293e-05, 0.00015795230865478516, 0.0002792179584503174, 0.0004004836082458496, 0.0005217492580413818, 0.0006430149078369141, 0.0007642805576324463, 0.0008855462074279785, 0.0010068118572235107, 0.001128077507019043, 0.0012493431568145752, 0.0013706088066101074, 0.0014918744564056396, 0.0016131401062011719, 0.001734405755996704, 0.0018556714057922363, 0.0019769370555877686, 0.0020982027053833008, 0.002219468355178833, 0.0023407340049743652, 0.0024619996547698975, 0.0025832653045654297, 0.002704530954360962, 0.002825796604156494, 0.0029470622539520264, 0.0030683279037475586, 0.003189593553543091, 0.003310859203338623, 0.0034321248531341553, 0.0035533905029296875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 0.0, 6.0, 3.0, 5.0, 4.0, 8.0, 4.0, 7.0, 6.0, 14.0, 22.0, 23.0, 23.0, 22.0, 38.0, 36.0, 56.0, 55.0, 79.0, 104.0, 73.0, 76.0, 67.0, 62.0, 43.0, 28.0, 25.0, 21.0, 12.0, 18.0, 14.0, 10.0, 8.0, 6.0, 5.0, 8.0, 4.0, 5.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0], "bins": [-0.0037441253662109375, -0.003643631935119629, -0.0035431385040283203, -0.0034426450729370117, -0.003342151641845703, -0.0032416582107543945, -0.003141164779663086, -0.0030406713485717773, -0.0029401779174804688, -0.00283968448638916, -0.0027391910552978516, -0.002638697624206543, -0.0025382041931152344, -0.0024377107620239258, -0.002337217330932617, -0.0022367238998413086, -0.00213623046875, -0.0020357370376586914, -0.0019352436065673828, -0.0018347501754760742, -0.0017342567443847656, -0.001633763313293457, -0.0015332698822021484, -0.0014327764511108398, -0.0013322830200195312, -0.0012317895889282227, -0.001131296157836914, -0.0010308027267456055, -0.0009303092956542969, -0.0008298158645629883, -0.0007293224334716797, -0.0006288290023803711, -0.0005283355712890625, -0.0004278421401977539, -0.0003273487091064453, -0.00022685527801513672, -0.00012636184692382812, -2.586841583251953e-05, 7.462501525878906e-05, 0.00017511844635009766, 0.00027561187744140625, 0.00037610530853271484, 0.00047659873962402344, 0.000577092170715332, 0.0006775856018066406, 0.0007780790328979492, 0.0008785724639892578, 0.0009790658950805664, 0.001079559326171875, 0.0011800527572631836, 0.0012805461883544922, 0.0013810396194458008, 0.0014815330505371094, 0.001582026481628418, 0.0016825199127197266, 0.0017830133438110352, 0.0018835067749023438, 0.0019840002059936523, 0.002084493637084961, 0.0021849870681762695, 0.002285480499267578, 0.0023859739303588867, 0.0024864673614501953, 0.002586960792541504, 0.0026874542236328125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 5.0, 10.0, 16.0, 25.0, 61.0, 113.0, 180.0, 214.0, 164.0, 96.0, 55.0, 31.0, 16.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06902939081192017, -0.06695427745580673, -0.0648791640996933, -0.06280405074357986, -0.06072893366217613, -0.0586538203060627, -0.056578706949949265, -0.05450359359383583, -0.0524284765124321, -0.050353363156318665, -0.04827824980020523, -0.0462031364440918, -0.044128019362688065, -0.04205290600657463, -0.0399777926504612, -0.03790267929434776, -0.03582756593823433, -0.033752452582120895, -0.03167733922600746, -0.02960222400724888, -0.027527108788490295, -0.02545199543237686, -0.023376882076263428, -0.021301768720149994, -0.01922665350139141, -0.017151540145277977, -0.015076424926519394, -0.01300131157040596, -0.010926197282969952, -0.008851082995533943, -0.006775969639420509, -0.004700855351984501, -0.0026257410645484924, -0.0005506270099431276, 0.0015244870446622372, 0.0035996008664369583, 0.005674715153872967, 0.007749829441308975, 0.009824942797422409, 0.011900057084858418, 0.013975171372294426, 0.01605028472840786, 0.018125399947166443, 0.020200513303279877, 0.02227562665939331, 0.024350741878151894, 0.026425855234265327, 0.02850097045302391, 0.030576083809137344, 0.03265119716525078, 0.03472631052136421, 0.036801427602767944, 0.03887654095888138, 0.04095165431499481, 0.043026767671108246, 0.04510188102722168, 0.047176994383335114, 0.04925210773944855, 0.05132722109556198, 0.053402334451675415, 0.05547745153307915, 0.05755256488919258, 0.059627678245306015, 0.06170279160141945, 0.06377790868282318]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 1.0, 1.0, 6.0, 5.0, 3.0, 4.0, 4.0, 7.0, 4.0, 3.0, 10.0, 11.0, 12.0, 14.0, 18.0, 14.0, 17.0, 16.0, 26.0, 29.0, 24.0, 27.0, 37.0, 37.0, 36.0, 29.0, 39.0, 32.0, 43.0, 40.0, 36.0, 29.0, 37.0, 28.0, 34.0, 29.0, 33.0, 31.0, 30.0, 21.0, 26.0, 26.0, 12.0, 12.0, 13.0, 11.0, 8.0, 7.0, 8.0, 7.0, 7.0, 3.0, 6.0, 5.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.030870914459228516, -0.02988198772072792, -0.028893062844872475, -0.02790413796901703, -0.026915211230516434, -0.02592628449201584, -0.024937359616160393, -0.023948434740304947, -0.022959508001804352, -0.021970581263303757, -0.02098165638744831, -0.019992731511592865, -0.01900380477309227, -0.018014878034591675, -0.01702595315873623, -0.016037028282880783, -0.015048101544380188, -0.014059175737202168, -0.013070249930024147, -0.012081324122846127, -0.011092398315668106, -0.010103472508490086, -0.009114546701312065, -0.008125620894134045, -0.007136695086956024, -0.006147769279778004, -0.005158843472599983, -0.004169917665421963, -0.0031809918582439423, -0.002192066051065922, -0.0012031402438879013, -0.00021421443670988083, 0.0007747113704681396, 0.0017636371776461601, 0.0027525629848241806, 0.003741488792002201, 0.0047304145991802216, 0.005719340406358242, 0.0067082662135362625, 0.007697192020714283, 0.008686117827892303, 0.009675043635070324, 0.010663969442248344, 0.011652895249426365, 0.012641821056604385, 0.013630746863782406, 0.014619672670960426, 0.015608598478138447, 0.016597524285316467, 0.017586451023817062, 0.018575375899672508, 0.019564300775527954, 0.02055322751402855, 0.021542154252529144, 0.02253107912838459, 0.023520004004240036, 0.02450893074274063, 0.025497857481241226, 0.026486782357096672, 0.027475707232952118, 0.028464633971452713, 0.029453560709953308, 0.030442485585808754, 0.0314314104616642, 0.032420337200164795]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 8.0, 19.0, 23.0, 54.0, 121.0, 336.0, 780.0, 4251.0, 51193.0, 4116289.0, 18251.0, 2009.0, 523.0, 207.0, 115.0, 32.0, 25.0, 17.0, 13.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.052398681640625, -0.0506134033203125, -0.048828125, -0.0470428466796875, -0.045257568359375, -0.0434722900390625, -0.04168701171875, -0.0399017333984375, -0.038116455078125, -0.0363311767578125, -0.0345458984375, -0.0327606201171875, -0.030975341796875, -0.0291900634765625, -0.02740478515625, -0.0256195068359375, -0.023834228515625, -0.0220489501953125, -0.020263671875, -0.0184783935546875, -0.016693115234375, -0.0149078369140625, -0.01312255859375, -0.0113372802734375, -0.009552001953125, -0.0077667236328125, -0.0059814453125, -0.0041961669921875, -0.002410888671875, -0.0006256103515625, 0.00115966796875, 0.0029449462890625, 0.004730224609375, 0.0065155029296875, 0.00830078125, 0.0100860595703125, 0.011871337890625, 0.0136566162109375, 0.01544189453125, 0.0172271728515625, 0.019012451171875, 0.0207977294921875, 0.0225830078125, 0.0243682861328125, 0.026153564453125, 0.0279388427734375, 0.02972412109375, 0.0315093994140625, 0.033294677734375, 0.0350799560546875, 0.036865234375, 0.0386505126953125, 0.040435791015625, 0.0422210693359375, 0.04400634765625, 0.0457916259765625, 0.047576904296875, 0.0493621826171875, 0.0511474609375, 0.0529327392578125, 0.054718017578125, 0.0565032958984375, 0.05828857421875, 0.0600738525390625, 0.061859130859375]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 24.0, 75.0, 155.0, 198.0, 233.0, 176.0, 84.0, 39.0, 12.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0224456787109375, -0.021700620651245117, -0.020955562591552734, -0.02021050453186035, -0.01946544647216797, -0.018720388412475586, -0.017975330352783203, -0.01723027229309082, -0.016485214233398438, -0.015740156173706055, -0.014995098114013672, -0.014250040054321289, -0.013504981994628906, -0.012759923934936523, -0.01201486587524414, -0.011269807815551758, -0.010524749755859375, -0.009779691696166992, -0.00903463363647461, -0.008289575576782227, -0.007544517517089844, -0.006799459457397461, -0.006054401397705078, -0.005309343338012695, -0.0045642852783203125, -0.0038192272186279297, -0.003074169158935547, -0.002329111099243164, -0.0015840530395507812, -0.0008389949798583984, -9.393692016601562e-05, 0.0006511211395263672, 0.00139617919921875, 0.002141237258911133, 0.0028862953186035156, 0.0036313533782958984, 0.004376411437988281, 0.005121469497680664, 0.005866527557373047, 0.00661158561706543, 0.0073566436767578125, 0.008101701736450195, 0.008846759796142578, 0.009591817855834961, 0.010336875915527344, 0.011081933975219727, 0.01182699203491211, 0.012572050094604492, 0.013317108154296875, 0.014062166213989258, 0.01480722427368164, 0.015552282333374023, 0.016297340393066406, 0.01704239845275879, 0.017787456512451172, 0.018532514572143555, 0.019277572631835938, 0.02002263069152832, 0.020767688751220703, 0.021512746810913086, 0.02225780487060547, 0.02300286293029785, 0.023747920989990234, 0.024492979049682617, 0.025238037109375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 6.0, 9.0, 4.0, 10.0, 17.0, 23.0, 42.0, 51.0, 92.0, 141.0, 227.0, 326.0, 510.0, 922.0, 1647.0, 3293.0, 7966.0, 25473.0, 130696.0, 3162229.0, 767582.0, 65780.0, 15811.0, 5537.0, 2516.0, 1350.0, 740.0, 445.0, 291.0, 182.0, 124.0, 87.0, 46.0, 28.0, 17.0, 20.0, 11.0, 8.0, 12.0, 3.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0119781494140625, -0.011576414108276367, -0.011174678802490234, -0.010772943496704102, -0.010371208190917969, -0.009969472885131836, -0.009567737579345703, -0.00916600227355957, -0.008764266967773438, -0.008362531661987305, -0.007960796356201172, -0.007559061050415039, -0.007157325744628906, -0.0067555904388427734, -0.006353855133056641, -0.005952119827270508, -0.005550384521484375, -0.005148649215698242, -0.004746913909912109, -0.0043451786041259766, -0.003943443298339844, -0.003541707992553711, -0.003139972686767578, -0.0027382373809814453, -0.0023365020751953125, -0.0019347667694091797, -0.0015330314636230469, -0.001131296157836914, -0.0007295608520507812, -0.00032782554626464844, 7.390975952148438e-05, 0.0004756450653076172, 0.00087738037109375, 0.0012791156768798828, 0.0016808509826660156, 0.0020825862884521484, 0.0024843215942382812, 0.002886056900024414, 0.003287792205810547, 0.0036895275115966797, 0.0040912628173828125, 0.004492998123168945, 0.004894733428955078, 0.005296468734741211, 0.005698204040527344, 0.0060999393463134766, 0.006501674652099609, 0.006903409957885742, 0.007305145263671875, 0.007706880569458008, 0.00810861587524414, 0.008510351181030273, 0.008912086486816406, 0.009313821792602539, 0.009715557098388672, 0.010117292404174805, 0.010519027709960938, 0.01092076301574707, 0.011322498321533203, 0.011724233627319336, 0.012125968933105469, 0.012527704238891602, 0.012929439544677734, 0.013331174850463867, 0.01373291015625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 8.0, 7.0, 9.0, 23.0, 30.0, 52.0, 94.0, 169.0, 510.0, 1635.0, 987.0, 255.0, 119.0, 74.0, 40.0, 14.0, 15.0, 11.0, 4.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014495849609375, -0.013932943344116211, -0.013370037078857422, -0.012807130813598633, -0.012244224548339844, -0.011681318283081055, -0.011118412017822266, -0.010555505752563477, -0.009992599487304688, -0.009429693222045898, -0.00886678695678711, -0.00830388069152832, -0.007740974426269531, -0.007178068161010742, -0.006615161895751953, -0.006052255630493164, -0.005489349365234375, -0.004926443099975586, -0.004363536834716797, -0.003800630569458008, -0.0032377243041992188, -0.0026748180389404297, -0.0021119117736816406, -0.0015490055084228516, -0.0009860992431640625, -0.00042319297790527344, 0.00013971328735351562, 0.0007026195526123047, 0.0012655258178710938, 0.0018284320831298828, 0.002391338348388672, 0.002954244613647461, 0.00351715087890625, 0.004080057144165039, 0.004642963409423828, 0.005205869674682617, 0.005768775939941406, 0.006331682205200195, 0.006894588470458984, 0.0074574947357177734, 0.008020401000976562, 0.008583307266235352, 0.00914621353149414, 0.00970911979675293, 0.010272026062011719, 0.010834932327270508, 0.011397838592529297, 0.011960744857788086, 0.012523651123046875, 0.013086557388305664, 0.013649463653564453, 0.014212369918823242, 0.014775276184082031, 0.01533818244934082, 0.01590108871459961, 0.0164639949798584, 0.017026901245117188, 0.017589807510375977, 0.018152713775634766, 0.018715620040893555, 0.019278526306152344, 0.019841432571411133, 0.020404338836669922, 0.02096724510192871, 0.0215301513671875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 4.0, 17.0, 30.0, 76.0, 138.0, 241.0, 213.0, 134.0, 73.0, 40.0, 17.0, 6.0, 6.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05832286924123764, -0.055631037801504135, -0.05293920636177063, -0.050247374922037125, -0.04755554348230362, -0.044863712042570114, -0.04217188060283661, -0.039480045437812805, -0.0367882177233696, -0.03409638628363609, -0.03140455484390259, -0.028712723404169083, -0.026020891964435577, -0.023329060524702072, -0.020637227222323418, -0.017945395782589912, -0.015253562480211258, -0.012561731040477753, -0.009869899600744247, -0.007178067229688168, -0.004486235789954662, -0.001794404350221157, 0.0008974280208349228, 0.003589259460568428, 0.006281090900301933, 0.008972922340035439, 0.011664753779768944, 0.014356586150825024, 0.017048418521881104, 0.01974024996161461, 0.022432081401348114, 0.02512391284108162, 0.027815744280815125, 0.03050757572054863, 0.033199407160282135, 0.03589123860001564, 0.038583070039749146, 0.04127490147948265, 0.043966732919216156, 0.04665856808423996, 0.049350395798683167, 0.05204222723841667, 0.05473405867815018, 0.05742589011788368, 0.06011772155761719, 0.06280955672264099, 0.0655013844370842, 0.068193219602108, 0.07088504731655121, 0.07357688248157501, 0.07626871019601822, 0.07896054536104202, 0.08165237307548523, 0.08434420824050903, 0.08703603595495224, 0.08972787111997604, 0.09241970628499985, 0.09511154145002365, 0.09780336916446686, 0.10049520432949066, 0.10318703204393387, 0.10587886720895767, 0.10857069492340088, 0.11126253008842468, 0.11395435780286789]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 11.0, 8.0, 11.0, 9.0, 17.0, 17.0, 28.0, 22.0, 25.0, 26.0, 36.0, 39.0, 30.0, 49.0, 41.0, 43.0, 50.0, 54.0, 39.0, 63.0, 44.0, 59.0, 29.0, 32.0, 34.0, 25.0, 34.0, 17.0, 20.0, 23.0, 13.0, 16.0, 8.0, 5.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04069274663925171, -0.039581507444381714, -0.03847026452422142, -0.03735902160406113, -0.03624778240919113, -0.035136543214321136, -0.03402530029416084, -0.03291405737400055, -0.031802818179130554, -0.03069157712161541, -0.029580336064100266, -0.02846909500658512, -0.027357853949069977, -0.026246612891554832, -0.025135371834039688, -0.024024130776524544, -0.0229128897190094, -0.021801648661494255, -0.02069040760397911, -0.019579166546463966, -0.018467925488948822, -0.017356684431433678, -0.016245443373918533, -0.015134202316403389, -0.014022961258888245, -0.0129117202013731, -0.011800479143857956, -0.010689238086342812, -0.009577997028827667, -0.008466755971312523, -0.0073555149137973785, -0.006244273856282234, -0.00513303279876709, -0.0040217917412519455, -0.002910550683736801, -0.0017993096262216568, -0.0006880685687065125, 0.0004231724888086319, 0.0015344135463237762, 0.0026456546038389206, 0.003756895661354065, 0.004868136718869209, 0.005979377776384354, 0.007090618833899498, 0.008201859891414642, 0.009313100948929787, 0.010424342006444931, 0.011535583063960075, 0.01264682412147522, 0.013758065178990364, 0.014869306236505508, 0.015980547294020653, 0.017091788351535797, 0.01820302940905094, 0.019314270466566086, 0.02042551152408123, 0.021536752581596375, 0.02264799363911152, 0.023759234696626663, 0.024870475754141808, 0.025981716811656952, 0.027092957869172096, 0.02820419892668724, 0.029315439984202385, 0.03042668104171753]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 7.0, 13.0, 11.0, 15.0, 22.0, 21.0, 30.0, 35.0, 51.0, 90.0, 77.0, 140.0, 170.0, 243.0, 378.0, 611.0, 1162.0, 3244.0, 15635.0, 238326.0, 734470.0, 43670.0, 6099.0, 1755.0, 778.0, 452.0, 258.0, 200.0, 148.0, 93.0, 74.0, 70.0, 49.0, 41.0, 15.0, 21.0, 17.0, 11.0, 9.0, 11.0, 9.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0347900390625, -0.03374290466308594, -0.032695770263671875, -0.03164863586425781, -0.03060150146484375, -0.029554367065429688, -0.028507232666015625, -0.027460098266601562, -0.0264129638671875, -0.025365829467773438, -0.024318695068359375, -0.023271560668945312, -0.02222442626953125, -0.021177291870117188, -0.020130157470703125, -0.019083023071289062, -0.018035888671875, -0.016988754272460938, -0.015941619873046875, -0.014894485473632812, -0.01384735107421875, -0.012800216674804688, -0.011753082275390625, -0.010705947875976562, -0.0096588134765625, -0.008611679077148438, -0.007564544677734375, -0.0065174102783203125, -0.00547027587890625, -0.0044231414794921875, -0.003376007080078125, -0.0023288726806640625, -0.00128173828125, -0.0002346038818359375, 0.000812530517578125, 0.0018596649169921875, 0.00290679931640625, 0.0039539337158203125, 0.005001068115234375, 0.0060482025146484375, 0.0070953369140625, 0.008142471313476562, 0.009189605712890625, 0.010236740112304688, 0.01128387451171875, 0.012331008911132812, 0.013378143310546875, 0.014425277709960938, 0.015472412109375, 0.016519546508789062, 0.017566680908203125, 0.018613815307617188, 0.01966094970703125, 0.020708084106445312, 0.021755218505859375, 0.022802352905273438, 0.0238494873046875, 0.024896621704101562, 0.025943756103515625, 0.026990890502929688, 0.02803802490234375, 0.029085159301757812, 0.030132293701171875, 0.031179428100585938, 0.0322265625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 35.0, 68.0, 146.0, 188.0, 202.0, 169.0, 111.0, 44.0, 24.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0210113525390625, -0.020316600799560547, -0.019621849060058594, -0.01892709732055664, -0.018232345581054688, -0.017537593841552734, -0.01684284210205078, -0.016148090362548828, -0.015453338623046875, -0.014758586883544922, -0.014063835144042969, -0.013369083404541016, -0.012674331665039062, -0.01197957992553711, -0.011284828186035156, -0.010590076446533203, -0.00989532470703125, -0.009200572967529297, -0.008505821228027344, -0.007811069488525391, -0.0071163177490234375, -0.006421566009521484, -0.005726814270019531, -0.005032062530517578, -0.004337310791015625, -0.003642559051513672, -0.0029478073120117188, -0.0022530555725097656, -0.0015583038330078125, -0.0008635520935058594, -0.00016880035400390625, 0.0005259513854980469, 0.001220703125, 0.0019154548645019531, 0.0026102066040039062, 0.0033049583435058594, 0.0039997100830078125, 0.004694461822509766, 0.005389213562011719, 0.006083965301513672, 0.006778717041015625, 0.007473468780517578, 0.008168220520019531, 0.008862972259521484, 0.009557723999023438, 0.01025247573852539, 0.010947227478027344, 0.011641979217529297, 0.01233673095703125, 0.013031482696533203, 0.013726234436035156, 0.01442098617553711, 0.015115737915039062, 0.015810489654541016, 0.01650524139404297, 0.017199993133544922, 0.017894744873046875, 0.018589496612548828, 0.01928424835205078, 0.019979000091552734, 0.020673751831054688, 0.02136850357055664, 0.022063255310058594, 0.022758007049560547, 0.0234527587890625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 2.0, 5.0, 7.0, 5.0, 7.0, 13.0, 14.0, 17.0, 34.0, 36.0, 60.0, 81.0, 148.0, 260.0, 406.0, 820.0, 1622.0, 3749.0, 10417.0, 33717.0, 135550.0, 495573.0, 274823.0, 62592.0, 17707.0, 6021.0, 2423.0, 1073.0, 561.0, 281.0, 157.0, 125.0, 68.0, 49.0, 43.0, 20.0, 18.0, 13.0, 15.0, 6.0, 5.0, 2.0, 4.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.016937255859375, -0.01643514633178711, -0.01593303680419922, -0.015430927276611328, -0.014928817749023438, -0.014426708221435547, -0.013924598693847656, -0.013422489166259766, -0.012920379638671875, -0.012418270111083984, -0.011916160583496094, -0.011414051055908203, -0.010911941528320312, -0.010409832000732422, -0.009907722473144531, -0.00940561294555664, -0.00890350341796875, -0.00840139389038086, -0.007899284362792969, -0.007397174835205078, -0.0068950653076171875, -0.006392955780029297, -0.005890846252441406, -0.005388736724853516, -0.004886627197265625, -0.004384517669677734, -0.0038824081420898438, -0.003380298614501953, -0.0028781890869140625, -0.002376079559326172, -0.0018739700317382812, -0.0013718605041503906, -0.0008697509765625, -0.0003676414489746094, 0.00013446807861328125, 0.0006365776062011719, 0.0011386871337890625, 0.0016407966613769531, 0.0021429061889648438, 0.0026450157165527344, 0.003147125244140625, 0.0036492347717285156, 0.004151344299316406, 0.004653453826904297, 0.0051555633544921875, 0.005657672882080078, 0.006159782409667969, 0.006661891937255859, 0.00716400146484375, 0.007666110992431641, 0.008168220520019531, 0.008670330047607422, 0.009172439575195312, 0.009674549102783203, 0.010176658630371094, 0.010678768157958984, 0.011180877685546875, 0.011682987213134766, 0.012185096740722656, 0.012687206268310547, 0.013189315795898438, 0.013691425323486328, 0.014193534851074219, 0.01469564437866211, 0.01519775390625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 7.0, 6.0, 4.0, 6.0, 3.0, 12.0, 9.0, 17.0, 14.0, 14.0, 20.0, 25.0, 26.0, 30.0, 45.0, 47.0, 44.0, 27.0, 49.0, 43.0, 52.0, 30.0, 51.0, 37.0, 25.0, 49.0, 41.0, 26.0, 36.0, 30.0, 37.0, 24.0, 16.0, 19.0, 16.0, 18.0, 8.0, 11.0, 7.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0152740478515625, -0.014789342880249023, -0.014304637908935547, -0.01381993293762207, -0.013335227966308594, -0.012850522994995117, -0.01236581802368164, -0.011881113052368164, -0.011396408081054688, -0.010911703109741211, -0.010426998138427734, -0.009942293167114258, -0.009457588195800781, -0.008972883224487305, -0.008488178253173828, -0.008003473281860352, -0.007518768310546875, -0.0070340633392333984, -0.006549358367919922, -0.006064653396606445, -0.005579948425292969, -0.005095243453979492, -0.004610538482666016, -0.004125833511352539, -0.0036411285400390625, -0.003156423568725586, -0.0026717185974121094, -0.002187013626098633, -0.0017023086547851562, -0.0012176036834716797, -0.0007328987121582031, -0.00024819374084472656, 0.00023651123046875, 0.0007212162017822266, 0.0012059211730957031, 0.0016906261444091797, 0.0021753311157226562, 0.002660036087036133, 0.0031447410583496094, 0.003629446029663086, 0.0041141510009765625, 0.004598855972290039, 0.005083560943603516, 0.005568265914916992, 0.006052970886230469, 0.006537675857543945, 0.007022380828857422, 0.0075070858001708984, 0.007991790771484375, 0.008476495742797852, 0.008961200714111328, 0.009445905685424805, 0.009930610656738281, 0.010415315628051758, 0.010900020599365234, 0.011384725570678711, 0.011869430541992188, 0.012354135513305664, 0.01283884048461914, 0.013323545455932617, 0.013808250427246094, 0.01429295539855957, 0.014777660369873047, 0.015262365341186523, 0.0157470703125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 5.0, 11.0, 5.0, 16.0, 12.0, 24.0, 46.0, 57.0, 85.0, 154.0, 232.0, 383.0, 785.0, 1462.0, 3226.0, 7610.0, 21042.0, 66557.0, 239735.0, 460548.0, 170848.0, 48274.0, 16042.0, 5964.0, 2676.0, 1232.0, 593.0, 353.0, 202.0, 111.0, 72.0, 63.0, 35.0, 27.0, 8.0, 18.0, 12.0, 10.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004596710205078125, -0.004440188407897949, -0.0042836666107177734, -0.004127144813537598, -0.003970623016357422, -0.003814101219177246, -0.0036575794219970703, -0.0035010576248168945, -0.0033445358276367188, -0.003188014030456543, -0.003031492233276367, -0.0028749704360961914, -0.0027184486389160156, -0.00256192684173584, -0.002405405044555664, -0.0022488832473754883, -0.0020923614501953125, -0.0019358396530151367, -0.001779317855834961, -0.0016227960586547852, -0.0014662742614746094, -0.0013097524642944336, -0.0011532306671142578, -0.000996708869934082, -0.0008401870727539062, -0.0006836652755737305, -0.0005271434783935547, -0.0003706216812133789, -0.00021409988403320312, -5.7578086853027344e-05, 9.894371032714844e-05, 0.0002554655075073242, 0.0004119873046875, 0.0005685091018676758, 0.0007250308990478516, 0.0008815526962280273, 0.0010380744934082031, 0.001194596290588379, 0.0013511180877685547, 0.0015076398849487305, 0.0016641616821289062, 0.001820683479309082, 0.001977205276489258, 0.0021337270736694336, 0.0022902488708496094, 0.002446770668029785, 0.002603292465209961, 0.0027598142623901367, 0.0029163360595703125, 0.0030728578567504883, 0.003229379653930664, 0.00338590145111084, 0.0035424232482910156, 0.0036989450454711914, 0.003855466842651367, 0.004011988639831543, 0.004168510437011719, 0.0043250322341918945, 0.00448155403137207, 0.004638075828552246, 0.004794597625732422, 0.004951119422912598, 0.0051076412200927734, 0.005264163017272949, 0.005420684814453125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 6.0, 4.0, 4.0, 5.0, 7.0, 8.0, 8.0, 9.0, 13.0, 17.0, 20.0, 25.0, 42.0, 34.0, 46.0, 67.0, 78.0, 82.0, 84.0, 73.0, 57.0, 64.0, 57.0, 49.0, 30.0, 24.0, 10.0, 14.0, 15.0, 6.0, 8.0, 8.0, 4.0, 3.0, 3.0, 2.0, 6.0, 1.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.143880844116211e-05, -4.9787573516368866e-05, -4.813633859157562e-05, -4.648510366678238e-05, -4.4833868741989136e-05, -4.318263381719589e-05, -4.153139889240265e-05, -3.9880163967609406e-05, -3.822892904281616e-05, -3.657769411802292e-05, -3.4926459193229675e-05, -3.327522426843643e-05, -3.162398934364319e-05, -2.9972754418849945e-05, -2.83215194940567e-05, -2.6670284569263458e-05, -2.5019049644470215e-05, -2.336781471967697e-05, -2.1716579794883728e-05, -2.0065344870090485e-05, -1.841410994529724e-05, -1.6762875020503998e-05, -1.5111640095710754e-05, -1.3460405170917511e-05, -1.1809170246124268e-05, -1.0157935321331024e-05, -8.50670039653778e-06, -6.855465471744537e-06, -5.204230546951294e-06, -3.5529956221580505e-06, -1.9017606973648071e-06, -2.505257725715637e-07, 1.4007091522216797e-06, 3.051944077014923e-06, 4.7031790018081665e-06, 6.35441392660141e-06, 8.005648851394653e-06, 9.656883776187897e-06, 1.130811870098114e-05, 1.2959353625774384e-05, 1.4610588550567627e-05, 1.626182347536087e-05, 1.7913058400154114e-05, 1.9564293324947357e-05, 2.12155282497406e-05, 2.2866763174533844e-05, 2.4517998099327087e-05, 2.616923302412033e-05, 2.7820467948913574e-05, 2.9471702873706818e-05, 3.112293779850006e-05, 3.2774172723293304e-05, 3.442540764808655e-05, 3.607664257287979e-05, 3.7727877497673035e-05, 3.937911242246628e-05, 4.103034734725952e-05, 4.2681582272052765e-05, 4.433281719684601e-05, 4.598405212163925e-05, 4.7635287046432495e-05, 4.928652197122574e-05, 5.093775689601898e-05, 5.2588991820812225e-05, 5.424022674560547e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 1.0, 3.0, 7.0, 8.0, 9.0, 10.0, 17.0, 24.0, 37.0, 63.0, 77.0, 110.0, 201.0, 308.0, 647.0, 1334.0, 3020.0, 8552.0, 30185.0, 129849.0, 527542.0, 266769.0, 56517.0, 14753.0, 4769.0, 1830.0, 833.0, 423.0, 226.0, 149.0, 87.0, 64.0, 46.0, 19.0, 22.0, 13.0, 9.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00655364990234375, -0.006347060203552246, -0.006140470504760742, -0.005933880805969238, -0.005727291107177734, -0.0055207014083862305, -0.0053141117095947266, -0.005107522010803223, -0.004900932312011719, -0.004694342613220215, -0.004487752914428711, -0.004281163215637207, -0.004074573516845703, -0.0038679838180541992, -0.0036613941192626953, -0.0034548044204711914, -0.0032482147216796875, -0.0030416250228881836, -0.0028350353240966797, -0.0026284456253051758, -0.002421855926513672, -0.002215266227722168, -0.002008676528930664, -0.0018020868301391602, -0.0015954971313476562, -0.0013889074325561523, -0.0011823177337646484, -0.0009757280349731445, -0.0007691383361816406, -0.0005625486373901367, -0.0003559589385986328, -0.0001493692398071289, 5.7220458984375e-05, 0.0002638101577758789, 0.0004703998565673828, 0.0006769895553588867, 0.0008835792541503906, 0.0010901689529418945, 0.0012967586517333984, 0.0015033483505249023, 0.0017099380493164062, 0.0019165277481079102, 0.002123117446899414, 0.002329707145690918, 0.002536296844482422, 0.0027428865432739258, 0.0029494762420654297, 0.0031560659408569336, 0.0033626556396484375, 0.0035692453384399414, 0.0037758350372314453, 0.003982424736022949, 0.004189014434814453, 0.004395604133605957, 0.004602193832397461, 0.004808783531188965, 0.005015373229980469, 0.005221962928771973, 0.0054285526275634766, 0.0056351423263549805, 0.005841732025146484, 0.006048321723937988, 0.006254911422729492, 0.006461501121520996, 0.0066680908203125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 3.0, 10.0, 6.0, 9.0, 13.0, 10.0, 14.0, 9.0, 14.0, 27.0, 33.0, 40.0, 62.0, 63.0, 78.0, 103.0, 91.0, 76.0, 77.0, 61.0, 38.0, 44.0, 18.0, 17.0, 10.0, 9.0, 10.0, 10.0, 4.0, 11.0, 7.0, 5.0, 4.0, 2.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004180908203125, -0.004029631614685059, -0.003878355026245117, -0.0037270784378051758, -0.0035758018493652344, -0.003424525260925293, -0.0032732486724853516, -0.00312197208404541, -0.0029706954956054688, -0.0028194189071655273, -0.002668142318725586, -0.0025168657302856445, -0.002365589141845703, -0.0022143125534057617, -0.0020630359649658203, -0.001911759376525879, -0.0017604827880859375, -0.001609206199645996, -0.0014579296112060547, -0.0013066530227661133, -0.0011553764343261719, -0.0010040998458862305, -0.0008528232574462891, -0.0007015466690063477, -0.0005502700805664062, -0.00039899349212646484, -0.00024771690368652344, -9.644031524658203e-05, 5.4836273193359375e-05, 0.00020611286163330078, 0.0003573894500732422, 0.0005086660385131836, 0.000659942626953125, 0.0008112192153930664, 0.0009624958038330078, 0.0011137723922729492, 0.0012650489807128906, 0.001416325569152832, 0.0015676021575927734, 0.0017188787460327148, 0.0018701553344726562, 0.0020214319229125977, 0.002172708511352539, 0.0023239850997924805, 0.002475261688232422, 0.0026265382766723633, 0.0027778148651123047, 0.002929091453552246, 0.0030803680419921875, 0.003231644630432129, 0.0033829212188720703, 0.0035341978073120117, 0.003685474395751953, 0.0038367509841918945, 0.003988027572631836, 0.004139304161071777, 0.004290580749511719, 0.00444185733795166, 0.0045931339263916016, 0.004744410514831543, 0.004895687103271484, 0.005046963691711426, 0.005198240280151367, 0.005349516868591309, 0.00550079345703125]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 37.0, 66.0, 165.0, 254.0, 258.0, 122.0, 57.0, 16.0, 9.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11946487426757812, -0.11543509364128113, -0.11140531301498413, -0.10737553238868713, -0.10334575176239014, -0.09931597113609314, -0.09528619050979614, -0.09125640988349915, -0.08722662925720215, -0.08319684863090515, -0.07916706800460815, -0.07513728737831116, -0.07110750675201416, -0.06707772612571716, -0.06304794549942017, -0.05901816114783287, -0.054988376796245575, -0.05095859616994858, -0.04692881554365158, -0.042899034917354584, -0.03886925429105759, -0.03483947366476059, -0.030809689313173294, -0.026779908686876297, -0.0227501280605793, -0.018720347434282303, -0.014690565876662731, -0.01066078431904316, -0.006631003692746162, -0.0026012230664491653, 0.001428559422492981, 0.005458340048789978, 0.009488120675086975, 0.013517901301383972, 0.01754768192768097, 0.021577464416623116, 0.025607245042920113, 0.02963702566921711, 0.033666808158159256, 0.03769658878445625, 0.04172636941075325, 0.04575615003705025, 0.049785930663347244, 0.05381571501493454, 0.05784549564123154, 0.061875276267528534, 0.06590505689382553, 0.06993483752012253, 0.07396461814641953, 0.07799439877271652, 0.08202417939901352, 0.08605396002531052, 0.09008374065160751, 0.09411352127790451, 0.0981433093547821, 0.1021730899810791, 0.1062028706073761, 0.1102326512336731, 0.11426243185997009, 0.11829221248626709, 0.12232199311256409, 0.12635177373886108, 0.13038155436515808, 0.13441133499145508, 0.13844111561775208]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 0.0, 4.0, 6.0, 10.0, 12.0, 7.0, 5.0, 9.0, 21.0, 20.0, 16.0, 31.0, 29.0, 24.0, 34.0, 32.0, 30.0, 24.0, 45.0, 49.0, 42.0, 40.0, 36.0, 30.0, 47.0, 39.0, 33.0, 32.0, 39.0, 35.0, 34.0, 24.0, 19.0, 20.0, 19.0, 18.0, 22.0, 13.0, 13.0, 9.0, 7.0, 5.0, 5.0, 5.0, 4.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.04824399948120117, -0.04679631069302559, -0.045348621904850006, -0.04390093684196472, -0.04245324805378914, -0.041005559265613556, -0.03955787420272827, -0.03811018541455269, -0.036662496626377106, -0.03521480783820152, -0.03376711905002594, -0.032319433987140656, -0.030871745198965073, -0.02942405641078949, -0.027976369485259056, -0.026528682559728622, -0.02508099377155304, -0.023633304983377457, -0.022185618057847023, -0.02073793113231659, -0.019290242344141006, -0.017842553555965424, -0.01639486663043499, -0.014947178773581982, -0.013499490916728973, -0.012051803059875965, -0.010604115203022957, -0.009156427346169949, -0.00770873948931694, -0.006261051632463932, -0.004813363775610924, -0.0033656759187579155, -0.0019179880619049072, -0.00047030020505189896, 0.0009773876518011093, 0.0024250755086541176, 0.003872763365507126, 0.005320451222360134, 0.006768139079213142, 0.00821582693606615, 0.009663514792919159, 0.011111202649772167, 0.012558890506625175, 0.014006578363478184, 0.015454266220331192, 0.016901955008506775, 0.01834964193403721, 0.019797328859567642, 0.021245017647743225, 0.022692706435918808, 0.02414039336144924, 0.025588080286979675, 0.027035769075155258, 0.02848345786333084, 0.029931144788861275, 0.03137883171439171, 0.03282652050256729, 0.034274209290742874, 0.03572189807891846, 0.03716958314180374, 0.038617271929979324, 0.04006496071815491, 0.04151264578104019, 0.042960334569215775, 0.04440802335739136]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 13.0, 15.0, 23.0, 64.0, 109.0, 246.0, 649.0, 2918.0, 16871.0, 4038820.0, 127585.0, 5306.0, 981.0, 330.0, 178.0, 84.0, 39.0, 32.0, 9.0, 5.0, 6.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046356201171875, -0.044742584228515625, -0.04312896728515625, -0.041515350341796875, -0.0399017333984375, -0.038288116455078125, -0.03667449951171875, -0.035060882568359375, -0.033447265625, -0.031833648681640625, -0.03022003173828125, -0.028606414794921875, -0.0269927978515625, -0.025379180908203125, -0.02376556396484375, -0.022151947021484375, -0.020538330078125, -0.018924713134765625, -0.01731109619140625, -0.015697479248046875, -0.0140838623046875, -0.012470245361328125, -0.01085662841796875, -0.009243011474609375, -0.00762939453125, -0.006015777587890625, -0.00440216064453125, -0.002788543701171875, -0.0011749267578125, 0.000438690185546875, 0.00205230712890625, 0.003665924072265625, 0.005279541015625, 0.006893157958984375, 0.00850677490234375, 0.010120391845703125, 0.0117340087890625, 0.013347625732421875, 0.01496124267578125, 0.016574859619140625, 0.0181884765625, 0.019802093505859375, 0.02141571044921875, 0.023029327392578125, 0.0246429443359375, 0.026256561279296875, 0.02787017822265625, 0.029483795166015625, 0.031097412109375, 0.032711029052734375, 0.03432464599609375, 0.035938262939453125, 0.0375518798828125, 0.039165496826171875, 0.04077911376953125, 0.042392730712890625, 0.04400634765625, 0.045619964599609375, 0.04723358154296875, 0.048847198486328125, 0.0504608154296875, 0.052074432373046875, 0.05368804931640625, 0.055301666259765625, 0.056915283203125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 25.0, 90.0, 143.0, 157.0, 211.0, 163.0, 116.0, 63.0, 19.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0211029052734375, -0.02040576934814453, -0.019708633422851562, -0.019011497497558594, -0.018314361572265625, -0.017617225646972656, -0.016920089721679688, -0.01622295379638672, -0.01552581787109375, -0.014828681945800781, -0.014131546020507812, -0.013434410095214844, -0.012737274169921875, -0.012040138244628906, -0.011343002319335938, -0.010645866394042969, -0.00994873046875, -0.009251594543457031, -0.008554458618164062, -0.007857322692871094, -0.007160186767578125, -0.006463050842285156, -0.0057659149169921875, -0.005068778991699219, -0.00437164306640625, -0.0036745071411132812, -0.0029773712158203125, -0.0022802352905273438, -0.001583099365234375, -0.0008859634399414062, -0.0001888275146484375, 0.0005083084106445312, 0.0012054443359375, 0.0019025802612304688, 0.0025997161865234375, 0.0032968521118164062, 0.003993988037109375, 0.004691123962402344, 0.0053882598876953125, 0.006085395812988281, 0.00678253173828125, 0.007479667663574219, 0.008176803588867188, 0.008873939514160156, 0.009571075439453125, 0.010268211364746094, 0.010965347290039062, 0.011662483215332031, 0.012359619140625, 0.013056755065917969, 0.013753890991210938, 0.014451026916503906, 0.015148162841796875, 0.015845298767089844, 0.016542434692382812, 0.01723957061767578, 0.01793670654296875, 0.01863384246826172, 0.019330978393554688, 0.020028114318847656, 0.020725250244140625, 0.021422386169433594, 0.022119522094726562, 0.02281665802001953, 0.0235137939453125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 6.0, 8.0, 10.0, 7.0, 10.0, 15.0, 31.0, 48.0, 66.0, 90.0, 173.0, 279.0, 424.0, 735.0, 1225.0, 2469.0, 5838.0, 17978.0, 78009.0, 792114.0, 3081826.0, 165065.0, 31274.0, 9086.0, 3476.0, 1706.0, 894.0, 516.0, 336.0, 211.0, 120.0, 74.0, 48.0, 24.0, 33.0, 15.0, 10.0, 6.0, 6.0, 7.0, 2.0, 4.0, 2.0, 3.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01238250732421875, -0.011943459510803223, -0.011504411697387695, -0.011065363883972168, -0.01062631607055664, -0.010187268257141113, -0.009748220443725586, -0.009309172630310059, -0.008870124816894531, -0.008431077003479004, -0.007992029190063477, -0.007552981376647949, -0.007113933563232422, -0.0066748857498168945, -0.006235837936401367, -0.00579679012298584, -0.0053577423095703125, -0.004918694496154785, -0.004479646682739258, -0.0040405988693237305, -0.003601551055908203, -0.0031625032424926758, -0.0027234554290771484, -0.002284407615661621, -0.0018453598022460938, -0.0014063119888305664, -0.0009672641754150391, -0.0005282163619995117, -8.916854858398438e-05, 0.00034987926483154297, 0.0007889270782470703, 0.0012279748916625977, 0.001667022705078125, 0.0021060705184936523, 0.0025451183319091797, 0.002984166145324707, 0.0034232139587402344, 0.0038622617721557617, 0.004301309585571289, 0.004740357398986816, 0.005179405212402344, 0.005618453025817871, 0.0060575008392333984, 0.006496548652648926, 0.006935596466064453, 0.0073746442794799805, 0.007813692092895508, 0.008252739906311035, 0.008691787719726562, 0.00913083553314209, 0.009569883346557617, 0.010008931159973145, 0.010447978973388672, 0.0108870267868042, 0.011326074600219727, 0.011765122413635254, 0.012204170227050781, 0.012643218040466309, 0.013082265853881836, 0.013521313667297363, 0.01396036148071289, 0.014399409294128418, 0.014838457107543945, 0.015277504920959473, 0.015716552734375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 5.0, 2.0, 5.0, 8.0, 15.0, 32.0, 51.0, 95.0, 176.0, 364.0, 1173.0, 1297.0, 425.0, 172.0, 90.0, 71.0, 30.0, 28.0, 14.0, 9.0, 8.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0161285400390625, -0.015510320663452148, -0.014892101287841797, -0.014273881912231445, -0.013655662536621094, -0.013037443161010742, -0.01241922378540039, -0.011801004409790039, -0.011182785034179688, -0.010564565658569336, -0.009946346282958984, -0.009328126907348633, -0.008709907531738281, -0.00809168815612793, -0.007473468780517578, -0.0068552494049072266, -0.006237030029296875, -0.0056188106536865234, -0.005000591278076172, -0.00438237190246582, -0.0037641525268554688, -0.003145933151245117, -0.0025277137756347656, -0.001909494400024414, -0.0012912750244140625, -0.0006730556488037109, -5.4836273193359375e-05, 0.0005633831024169922, 0.0011816024780273438, 0.0017998218536376953, 0.002418041229248047, 0.0030362606048583984, 0.00365447998046875, 0.0042726993560791016, 0.004890918731689453, 0.005509138107299805, 0.006127357482910156, 0.006745576858520508, 0.007363796234130859, 0.007982015609741211, 0.008600234985351562, 0.009218454360961914, 0.009836673736572266, 0.010454893112182617, 0.011073112487792969, 0.01169133186340332, 0.012309551239013672, 0.012927770614624023, 0.013545989990234375, 0.014164209365844727, 0.014782428741455078, 0.01540064811706543, 0.01601886749267578, 0.016637086868286133, 0.017255306243896484, 0.017873525619506836, 0.018491744995117188, 0.01910996437072754, 0.01972818374633789, 0.020346403121948242, 0.020964622497558594, 0.021582841873168945, 0.022201061248779297, 0.02281928062438965, 0.0234375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 7.0, 13.0, 39.0, 78.0, 134.0, 195.0, 211.0, 158.0, 92.0, 41.0, 13.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.13335302472114563, -0.13037721812725067, -0.1274014115333557, -0.12442560493946075, -0.1214497983455658, -0.11847399175167084, -0.11549818515777588, -0.11252237111330032, -0.10954656451940536, -0.1065707579255104, -0.10359495133161545, -0.10061914473772049, -0.09764333814382553, -0.09466752409934998, -0.09169171750545502, -0.08871591091156006, -0.0857401043176651, -0.08276429772377014, -0.07978849112987518, -0.07681268453598022, -0.07383687794208527, -0.07086107134819031, -0.06788526475429535, -0.0649094507098198, -0.06193365156650543, -0.058957844972610474, -0.055982038378715515, -0.05300623178482056, -0.0500304214656353, -0.04705461487174034, -0.04407880827784538, -0.041102997958660126, -0.03812718763947487, -0.03515138104557991, -0.03217557445168495, -0.029199765995144844, -0.026223957538604736, -0.023248150944709778, -0.02027234435081482, -0.01729653589427471, -0.014320729300379753, -0.01134492177516222, -0.008369114249944687, -0.005393307656049728, -0.0024175001308321953, 0.0005583073943853378, 0.0035341139882802963, 0.006509922444820404, 0.009485729038715363, 0.012461536563932896, 0.015437344089150429, 0.018413150683045387, 0.021388959139585495, 0.024364765733480453, 0.027340572327375412, 0.03031638078391552, 0.03329218924045563, 0.036267995834350586, 0.039243802428245544, 0.0422196090221405, 0.04519541934132576, 0.04817122593522072, 0.05114703252911568, 0.054122842848300934, 0.057098645716905594]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 9.0, 6.0, 6.0, 10.0, 18.0, 20.0, 25.0, 33.0, 36.0, 38.0, 38.0, 22.0, 38.0, 51.0, 41.0, 54.0, 53.0, 52.0, 45.0, 42.0, 53.0, 46.0, 58.0, 31.0, 29.0, 29.0, 29.0, 24.0, 14.0, 10.0, 10.0, 7.0, 6.0, 2.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.046895623207092285, -0.04558660089969635, -0.04427757486701012, -0.04296854883432388, -0.04165952652692795, -0.04035050421953201, -0.03904147818684578, -0.037732452154159546, -0.03642342984676361, -0.035114407539367676, -0.03380538150668144, -0.03249635547399521, -0.031187333166599274, -0.02987830899655819, -0.028569284826517105, -0.02726026065647602, -0.025951236486434937, -0.024642212316393852, -0.023333188146352768, -0.022024163976311684, -0.0207151398062706, -0.019406115636229515, -0.01809709146618843, -0.016788067296147346, -0.015479043126106262, -0.014170018956065178, -0.012860994786024094, -0.01155197061598301, -0.010242946445941925, -0.00893392227590084, -0.0076248981058597565, -0.006315873935818672, -0.005006849765777588, -0.0036978255957365036, -0.0023888014256954193, -0.001079777255654335, 0.00022924691438674927, 0.0015382710844278336, 0.002847295254468918, 0.004156319424510002, 0.005465343594551086, 0.006774367764592171, 0.008083391934633255, 0.00939241610467434, 0.010701440274715424, 0.012010464444756508, 0.013319488614797592, 0.014628512784838676, 0.01593753695487976, 0.017246561124920845, 0.01855558529496193, 0.019864609465003014, 0.021173633635044098, 0.022482657805085182, 0.023791681975126266, 0.02510070614516735, 0.026409730315208435, 0.02771875448524952, 0.029027778655290604, 0.030336802825331688, 0.03164582699537277, 0.03295484930276871, 0.03426387533545494, 0.035572901368141174, 0.03688192367553711]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 4.0, 10.0, 8.0, 13.0, 22.0, 23.0, 37.0, 35.0, 63.0, 72.0, 110.0, 171.0, 246.0, 366.0, 560.0, 1213.0, 3118.0, 16789.0, 290099.0, 690403.0, 36581.0, 4984.0, 1513.0, 713.0, 442.0, 277.0, 199.0, 135.0, 90.0, 59.0, 55.0, 28.0, 28.0, 20.0, 16.0, 13.0, 8.0, 7.0, 6.0, 2.0, 6.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0413818359375, -0.04009532928466797, -0.03880882263183594, -0.037522315979003906, -0.036235809326171875, -0.034949302673339844, -0.03366279602050781, -0.03237628936767578, -0.03108978271484375, -0.02980327606201172, -0.028516769409179688, -0.027230262756347656, -0.025943756103515625, -0.024657249450683594, -0.023370742797851562, -0.02208423614501953, -0.0207977294921875, -0.01951122283935547, -0.018224716186523438, -0.016938209533691406, -0.015651702880859375, -0.014365196228027344, -0.013078689575195312, -0.011792182922363281, -0.01050567626953125, -0.009219169616699219, -0.007932662963867188, -0.006646156311035156, -0.005359649658203125, -0.004073143005371094, -0.0027866363525390625, -0.0015001296997070312, -0.000213623046875, 0.0010728836059570312, 0.0023593902587890625, 0.0036458969116210938, 0.004932403564453125, 0.006218910217285156, 0.0075054168701171875, 0.008791923522949219, 0.01007843017578125, 0.011364936828613281, 0.012651443481445312, 0.013937950134277344, 0.015224456787109375, 0.016510963439941406, 0.017797470092773438, 0.01908397674560547, 0.0203704833984375, 0.02165699005126953, 0.022943496704101562, 0.024230003356933594, 0.025516510009765625, 0.026803016662597656, 0.028089523315429688, 0.02937602996826172, 0.03066253662109375, 0.03194904327392578, 0.03323554992675781, 0.034522056579589844, 0.035808563232421875, 0.037095069885253906, 0.03838157653808594, 0.03966808319091797, 0.04095458984375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 44.0, 89.0, 149.0, 168.0, 207.0, 149.0, 111.0, 55.0, 12.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0226287841796875, -0.02190113067626953, -0.021173477172851562, -0.020445823669433594, -0.019718170166015625, -0.018990516662597656, -0.018262863159179688, -0.01753520965576172, -0.01680755615234375, -0.01607990264892578, -0.015352249145507812, -0.014624595642089844, -0.013896942138671875, -0.013169288635253906, -0.012441635131835938, -0.011713981628417969, -0.010986328125, -0.010258674621582031, -0.009531021118164062, -0.008803367614746094, -0.008075714111328125, -0.007348060607910156, -0.0066204071044921875, -0.005892753601074219, -0.00516510009765625, -0.004437446594238281, -0.0037097930908203125, -0.0029821395874023438, -0.002254486083984375, -0.0015268325805664062, -0.0007991790771484375, -7.152557373046875e-05, 0.0006561279296875, 0.0013837814331054688, 0.0021114349365234375, 0.0028390884399414062, 0.003566741943359375, 0.004294395446777344, 0.0050220489501953125, 0.005749702453613281, 0.00647735595703125, 0.007205009460449219, 0.007932662963867188, 0.008660316467285156, 0.009387969970703125, 0.010115623474121094, 0.010843276977539062, 0.011570930480957031, 0.012298583984375, 0.013026237487792969, 0.013753890991210938, 0.014481544494628906, 0.015209197998046875, 0.015936851501464844, 0.016664505004882812, 0.01739215850830078, 0.01811981201171875, 0.01884746551513672, 0.019575119018554688, 0.020302772521972656, 0.021030426025390625, 0.021758079528808594, 0.022485733032226562, 0.02321338653564453, 0.0239410400390625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 5.0, 12.0, 8.0, 11.0, 17.0, 29.0, 43.0, 68.0, 59.0, 131.0, 183.0, 334.0, 594.0, 1107.0, 2106.0, 4406.0, 9797.0, 26866.0, 96809.0, 414529.0, 366834.0, 83120.0, 23938.0, 9043.0, 4130.0, 1928.0, 1078.0, 557.0, 301.0, 177.0, 102.0, 70.0, 41.0, 39.0, 15.0, 24.0, 14.0, 7.0, 8.0, 4.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.0216064453125, -0.02100539207458496, -0.020404338836669922, -0.019803285598754883, -0.019202232360839844, -0.018601179122924805, -0.018000125885009766, -0.017399072647094727, -0.016798019409179688, -0.01619696617126465, -0.01559591293334961, -0.01499485969543457, -0.014393806457519531, -0.013792753219604492, -0.013191699981689453, -0.012590646743774414, -0.011989593505859375, -0.011388540267944336, -0.010787487030029297, -0.010186433792114258, -0.009585380554199219, -0.00898432731628418, -0.00838327407836914, -0.0077822208404541016, -0.0071811676025390625, -0.0065801143646240234, -0.005979061126708984, -0.005378007888793945, -0.004776954650878906, -0.004175901412963867, -0.003574848175048828, -0.002973794937133789, -0.00237274169921875, -0.001771688461303711, -0.0011706352233886719, -0.0005695819854736328, 3.147125244140625e-05, 0.0006325244903564453, 0.0012335777282714844, 0.0018346309661865234, 0.0024356842041015625, 0.0030367374420166016, 0.0036377906799316406, 0.00423884391784668, 0.004839897155761719, 0.005440950393676758, 0.006042003631591797, 0.006643056869506836, 0.007244110107421875, 0.007845163345336914, 0.008446216583251953, 0.009047269821166992, 0.009648323059082031, 0.01024937629699707, 0.01085042953491211, 0.011451482772827148, 0.012052536010742188, 0.012653589248657227, 0.013254642486572266, 0.013855695724487305, 0.014456748962402344, 0.015057802200317383, 0.015658855438232422, 0.01625990867614746, 0.0168609619140625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 3.0, 6.0, 4.0, 12.0, 8.0, 7.0, 13.0, 20.0, 19.0, 22.0, 33.0, 37.0, 40.0, 52.0, 51.0, 64.0, 75.0, 82.0, 58.0, 53.0, 49.0, 40.0, 45.0, 37.0, 33.0, 32.0, 26.0, 24.0, 9.0, 6.0, 13.0, 7.0, 8.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0249176025390625, -0.02414870262145996, -0.023379802703857422, -0.022610902786254883, -0.021842002868652344, -0.021073102951049805, -0.020304203033447266, -0.019535303115844727, -0.018766403198242188, -0.01799750328063965, -0.01722860336303711, -0.01645970344543457, -0.01569080352783203, -0.014921903610229492, -0.014153003692626953, -0.013384103775024414, -0.012615203857421875, -0.011846303939819336, -0.011077404022216797, -0.010308504104614258, -0.009539604187011719, -0.00877070426940918, -0.00800180435180664, -0.0072329044342041016, -0.0064640045166015625, -0.0056951045989990234, -0.004926204681396484, -0.004157304763793945, -0.0033884048461914062, -0.002619504928588867, -0.0018506050109863281, -0.001081705093383789, -0.00031280517578125, 0.00045609474182128906, 0.0012249946594238281, 0.001993894577026367, 0.0027627944946289062, 0.0035316944122314453, 0.004300594329833984, 0.0050694942474365234, 0.0058383941650390625, 0.0066072940826416016, 0.007376194000244141, 0.00814509391784668, 0.008913993835449219, 0.009682893753051758, 0.010451793670654297, 0.011220693588256836, 0.011989593505859375, 0.012758493423461914, 0.013527393341064453, 0.014296293258666992, 0.015065193176269531, 0.01583409309387207, 0.01660299301147461, 0.01737189292907715, 0.018140792846679688, 0.018909692764282227, 0.019678592681884766, 0.020447492599487305, 0.021216392517089844, 0.021985292434692383, 0.022754192352294922, 0.02352309226989746, 0.0242919921875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 8.0, 3.0, 4.0, 7.0, 14.0, 25.0, 32.0, 40.0, 62.0, 98.0, 163.0, 273.0, 513.0, 883.0, 1763.0, 3579.0, 7468.0, 16722.0, 41461.0, 134433.0, 514361.0, 224882.0, 59854.0, 22523.0, 9877.0, 4670.0, 2246.0, 1156.0, 619.0, 325.0, 174.0, 106.0, 67.0, 42.0, 34.0, 27.0, 16.0, 12.0, 5.0, 10.0, 5.0, 0.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0072021484375, -0.006959438323974609, -0.006716728210449219, -0.006474018096923828, -0.0062313079833984375, -0.005988597869873047, -0.005745887756347656, -0.005503177642822266, -0.005260467529296875, -0.005017757415771484, -0.004775047302246094, -0.004532337188720703, -0.0042896270751953125, -0.004046916961669922, -0.0038042068481445312, -0.0035614967346191406, -0.00331878662109375, -0.0030760765075683594, -0.0028333663940429688, -0.002590656280517578, -0.0023479461669921875, -0.002105236053466797, -0.0018625259399414062, -0.0016198158264160156, -0.001377105712890625, -0.0011343955993652344, -0.0008916854858398438, -0.0006489753723144531, -0.0004062652587890625, -0.00016355514526367188, 7.915496826171875e-05, 0.0003218650817871094, 0.0005645751953125, 0.0008072853088378906, 0.0010499954223632812, 0.0012927055358886719, 0.0015354156494140625, 0.0017781257629394531, 0.0020208358764648438, 0.0022635459899902344, 0.002506256103515625, 0.0027489662170410156, 0.0029916763305664062, 0.003234386444091797, 0.0034770965576171875, 0.003719806671142578, 0.003962516784667969, 0.004205226898193359, 0.00444793701171875, 0.004690647125244141, 0.004933357238769531, 0.005176067352294922, 0.0054187774658203125, 0.005661487579345703, 0.005904197692871094, 0.006146907806396484, 0.006389617919921875, 0.006632328033447266, 0.006875038146972656, 0.007117748260498047, 0.0073604583740234375, 0.007603168487548828, 0.007845878601074219, 0.00808858871459961, 0.008331298828125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 12.0, 19.0, 23.0, 34.0, 49.0, 60.0, 67.0, 76.0, 88.0, 71.0, 93.0, 71.0, 81.0, 63.0, 54.0, 31.0, 25.0, 21.0, 9.0, 5.0, 9.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-5.9664249420166016e-05, -5.7783909142017365e-05, -5.590356886386871e-05, -5.402322858572006e-05, -5.214288830757141e-05, -5.026254802942276e-05, -4.838220775127411e-05, -4.650186747312546e-05, -4.462152719497681e-05, -4.2741186916828156e-05, -4.0860846638679504e-05, -3.898050636053085e-05, -3.71001660823822e-05, -3.521982580423355e-05, -3.33394855260849e-05, -3.145914524793625e-05, -2.9578804969787598e-05, -2.7698464691638947e-05, -2.5818124413490295e-05, -2.3937784135341644e-05, -2.2057443857192993e-05, -2.0177103579044342e-05, -1.829676330089569e-05, -1.641642302274704e-05, -1.4536082744598389e-05, -1.2655742466449738e-05, -1.0775402188301086e-05, -8.895061910152435e-06, -7.014721632003784e-06, -5.134381353855133e-06, -3.254041075706482e-06, -1.3737007975578308e-06, 5.066394805908203e-07, 2.3869797587394714e-06, 4.2673200368881226e-06, 6.147660315036774e-06, 8.028000593185425e-06, 9.908340871334076e-06, 1.1788681149482727e-05, 1.3669021427631378e-05, 1.554936170578003e-05, 1.742970198392868e-05, 1.931004226207733e-05, 2.1190382540225983e-05, 2.3070722818374634e-05, 2.4951063096523285e-05, 2.6831403374671936e-05, 2.8711743652820587e-05, 3.059208393096924e-05, 3.247242420911789e-05, 3.435276448726654e-05, 3.623310476541519e-05, 3.811344504356384e-05, 3.9993785321712494e-05, 4.1874125599861145e-05, 4.3754465878009796e-05, 4.563480615615845e-05, 4.75151464343071e-05, 4.939548671245575e-05, 5.12758269906044e-05, 5.315616726875305e-05, 5.50365075469017e-05, 5.6916847825050354e-05, 5.8797188103199005e-05, 6.0677528381347656e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 6.0, 4.0, 7.0, 16.0, 20.0, 22.0, 36.0, 55.0, 100.0, 153.0, 324.0, 687.0, 1454.0, 3527.0, 9388.0, 29239.0, 114672.0, 585012.0, 230291.0, 49610.0, 14770.0, 5127.0, 2077.0, 933.0, 450.0, 233.0, 130.0, 77.0, 46.0, 32.0, 14.0, 11.0, 3.0, 7.0, 9.0, 6.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.01105499267578125, -0.010736465454101562, -0.010417938232421875, -0.010099411010742188, -0.0097808837890625, -0.009462356567382812, -0.009143829345703125, -0.008825302124023438, -0.00850677490234375, -0.008188247680664062, -0.007869720458984375, -0.0075511932373046875, -0.007232666015625, -0.0069141387939453125, -0.006595611572265625, -0.0062770843505859375, -0.00595855712890625, -0.0056400299072265625, -0.005321502685546875, -0.0050029754638671875, -0.0046844482421875, -0.0043659210205078125, -0.004047393798828125, -0.0037288665771484375, -0.00341033935546875, -0.0030918121337890625, -0.002773284912109375, -0.0024547576904296875, -0.00213623046875, -0.0018177032470703125, -0.001499176025390625, -0.0011806488037109375, -0.00086212158203125, -0.0005435943603515625, -0.000225067138671875, 9.34600830078125e-05, 0.0004119873046875, 0.0007305145263671875, 0.001049041748046875, 0.0013675689697265625, 0.00168609619140625, 0.0020046234130859375, 0.002323150634765625, 0.0026416778564453125, 0.002960205078125, 0.0032787322998046875, 0.003597259521484375, 0.0039157867431640625, 0.00423431396484375, 0.0045528411865234375, 0.004871368408203125, 0.0051898956298828125, 0.0055084228515625, 0.0058269500732421875, 0.006145477294921875, 0.0064640045166015625, 0.00678253173828125, 0.0071010589599609375, 0.007419586181640625, 0.0077381134033203125, 0.008056640625, 0.008375167846679688, 0.008693695068359375, 0.009012222290039062, 0.00933074951171875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 3.0, 5.0, 13.0, 16.0, 20.0, 24.0, 29.0, 23.0, 43.0, 57.0, 88.0, 158.0, 160.0, 80.0, 52.0, 46.0, 40.0, 26.0, 28.0, 17.0, 17.0, 11.0, 5.0, 6.0, 3.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006984710693359375, -0.006715595722198486, -0.006446480751037598, -0.006177365779876709, -0.00590825080871582, -0.005639135837554932, -0.005370020866394043, -0.005100905895233154, -0.004831790924072266, -0.004562675952911377, -0.004293560981750488, -0.0040244460105896, -0.003755331039428711, -0.0034862160682678223, -0.0032171010971069336, -0.002947986125946045, -0.0026788711547851562, -0.0024097561836242676, -0.002140641212463379, -0.0018715262413024902, -0.0016024112701416016, -0.0013332962989807129, -0.0010641813278198242, -0.0007950663566589355, -0.0005259513854980469, -0.0002568364143371582, 1.2278556823730469e-05, 0.00028139352798461914, 0.0005505084991455078, 0.0008196234703063965, 0.0010887384414672852, 0.0013578534126281738, 0.0016269683837890625, 0.0018960833549499512, 0.00216519832611084, 0.0024343132972717285, 0.002703428268432617, 0.002972543239593506, 0.0032416582107543945, 0.003510773181915283, 0.003779888153076172, 0.0040490031242370605, 0.004318118095397949, 0.004587233066558838, 0.0048563480377197266, 0.005125463008880615, 0.005394577980041504, 0.005663692951202393, 0.005932807922363281, 0.00620192289352417, 0.006471037864685059, 0.006740152835845947, 0.007009267807006836, 0.007278382778167725, 0.007547497749328613, 0.007816612720489502, 0.00808572769165039, 0.00835484266281128, 0.008623957633972168, 0.008893072605133057, 0.009162187576293945, 0.009431302547454834, 0.009700417518615723, 0.009969532489776611, 0.0102386474609375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 12.0, 14.0, 42.0, 71.0, 133.0, 183.0, 170.0, 150.0, 99.0, 57.0, 31.0, 18.0, 7.0, 4.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09029798209667206, -0.0861680805683136, -0.08203817903995514, -0.07790827006101608, -0.07377836853265762, -0.06964846700429916, -0.06551855802536011, -0.06138865649700165, -0.05725875496864319, -0.05312885344028473, -0.04899894818663597, -0.04486904293298721, -0.040739141404628754, -0.036609239876270294, -0.032479334622621536, -0.028349431231617928, -0.02421952784061432, -0.02008962444961071, -0.0159597210586071, -0.011829817667603493, -0.007699914276599884, -0.0035700108855962753, 0.0005598925054073334, 0.004689795896410942, 0.00881969928741455, 0.01294960267841816, 0.017079506069421768, 0.021209409460425377, 0.025339312851428986, 0.029469216242432594, 0.0335991196334362, 0.03772902488708496, 0.04185891151428223, 0.045988813042640686, 0.050118718296289444, 0.0542486235499382, 0.05837852507829666, 0.06250842660665512, 0.06663833558559418, 0.07076823711395264, 0.0748981386423111, 0.07902804017066956, 0.08315794169902802, 0.08728785067796707, 0.09141775220632553, 0.09554765373468399, 0.09967756271362305, 0.1038074642419815, 0.10793736577033997, 0.11206726729869843, 0.11619716882705688, 0.12032707780599594, 0.1244569793343544, 0.12858688831329346, 0.13271678984165192, 0.13684669137001038, 0.14097659289836884, 0.1451064944267273, 0.14923639595508575, 0.1533662974834442, 0.15749621391296387, 0.16162611544132233, 0.1657560169696808, 0.16988591849803925, 0.1740158200263977]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 7.0, 11.0, 12.0, 11.0, 14.0, 18.0, 33.0, 23.0, 36.0, 33.0, 33.0, 35.0, 38.0, 60.0, 59.0, 64.0, 52.0, 48.0, 48.0, 44.0, 41.0, 47.0, 52.0, 36.0, 24.0, 22.0, 22.0, 14.0, 18.0, 10.0, 5.0, 7.0, 7.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0652388334274292, -0.06305601447820663, -0.06087320297956467, -0.0586903840303421, -0.056507568806409836, -0.05432475358247757, -0.052141934633255005, -0.04995911940932274, -0.04777630418539047, -0.045593488961458206, -0.04341067373752594, -0.041227854788303375, -0.03904503956437111, -0.03686222434043884, -0.03467940539121628, -0.03249659016728401, -0.030313774943351746, -0.02813095971941948, -0.025948142632842064, -0.02376532554626465, -0.021582510322332382, -0.019399695098400116, -0.0172168780118227, -0.01503406185656786, -0.012851245701313019, -0.010668429546058178, -0.008485613390803337, -0.006302797235548496, -0.004119981080293655, -0.0019371649250388145, 0.0002456512302160263, 0.002428467385470867, 0.004611283540725708, 0.006794099695980549, 0.00897691585123539, 0.01115973200649023, 0.013342548161745071, 0.015525364316999912, 0.017708180472254753, 0.01989099755883217, 0.022073812782764435, 0.0242566280066967, 0.026439445093274117, 0.028622262179851532, 0.030805077403783798, 0.032987892627716064, 0.03517071157693863, 0.037353526800870895, 0.03953634202480316, 0.04171915724873543, 0.043901972472667694, 0.04608479142189026, 0.048267606645822525, 0.05045042186975479, 0.052633240818977356, 0.05481605604290962, 0.05699887126684189, 0.059181686490774155, 0.06136450171470642, 0.06354732066392899, 0.06573013961315155, 0.06791295111179352, 0.07009577006101608, 0.07227858155965805, 0.07446140050888062]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 5.0, 9.0, 14.0, 8.0, 16.0, 14.0, 20.0, 28.0, 41.0, 51.0, 82.0, 99.0, 140.0, 223.0, 394.0, 702.0, 1701.0, 3612.0, 9481.0, 50049.0, 1706378.0, 2337990.0, 63763.0, 12140.0, 4017.0, 1526.0, 686.0, 352.0, 223.0, 140.0, 96.0, 66.0, 47.0, 32.0, 41.0, 24.0, 15.0, 17.0, 7.0, 6.0, 10.0, 6.0, 2.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.0244598388671875, -0.02371954917907715, -0.022979259490966797, -0.022238969802856445, -0.021498680114746094, -0.020758390426635742, -0.02001810073852539, -0.01927781105041504, -0.018537521362304688, -0.017797231674194336, -0.017056941986083984, -0.016316652297973633, -0.015576362609863281, -0.01483607292175293, -0.014095783233642578, -0.013355493545532227, -0.012615203857421875, -0.011874914169311523, -0.011134624481201172, -0.01039433479309082, -0.009654045104980469, -0.008913755416870117, -0.008173465728759766, -0.007433176040649414, -0.0066928863525390625, -0.005952596664428711, -0.005212306976318359, -0.004472017288208008, -0.0037317276000976562, -0.0029914379119873047, -0.002251148223876953, -0.0015108585357666016, -0.00077056884765625, -3.0279159545898438e-05, 0.0007100105285644531, 0.0014503002166748047, 0.0021905899047851562, 0.002930879592895508, 0.0036711692810058594, 0.004411458969116211, 0.0051517486572265625, 0.005892038345336914, 0.006632328033447266, 0.007372617721557617, 0.008112907409667969, 0.00885319709777832, 0.009593486785888672, 0.010333776473999023, 0.011074066162109375, 0.011814355850219727, 0.012554645538330078, 0.01329493522644043, 0.014035224914550781, 0.014775514602661133, 0.015515804290771484, 0.016256093978881836, 0.016996383666992188, 0.01773667335510254, 0.01847696304321289, 0.019217252731323242, 0.019957542419433594, 0.020697832107543945, 0.021438121795654297, 0.02217841148376465, 0.022918701171875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 13.0, 50.0, 102.0, 184.0, 208.0, 185.0, 123.0, 95.0, 29.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0251617431640625, -0.024368762969970703, -0.023575782775878906, -0.02278280258178711, -0.021989822387695312, -0.021196842193603516, -0.02040386199951172, -0.019610881805419922, -0.018817901611328125, -0.018024921417236328, -0.01723194122314453, -0.016438961029052734, -0.015645980834960938, -0.01485300064086914, -0.014060020446777344, -0.013267040252685547, -0.01247406005859375, -0.011681079864501953, -0.010888099670410156, -0.01009511947631836, -0.009302139282226562, -0.008509159088134766, -0.007716178894042969, -0.006923198699951172, -0.006130218505859375, -0.005337238311767578, -0.004544258117675781, -0.0037512779235839844, -0.0029582977294921875, -0.0021653175354003906, -0.0013723373413085938, -0.0005793571472167969, 0.000213623046875, 0.0010066032409667969, 0.0017995834350585938, 0.0025925636291503906, 0.0033855438232421875, 0.004178524017333984, 0.004971504211425781, 0.005764484405517578, 0.006557464599609375, 0.007350444793701172, 0.008143424987792969, 0.008936405181884766, 0.009729385375976562, 0.01052236557006836, 0.011315345764160156, 0.012108325958251953, 0.01290130615234375, 0.013694286346435547, 0.014487266540527344, 0.01528024673461914, 0.016073226928710938, 0.016866207122802734, 0.01765918731689453, 0.018452167510986328, 0.019245147705078125, 0.020038127899169922, 0.02083110809326172, 0.021624088287353516, 0.022417068481445312, 0.02321004867553711, 0.024003028869628906, 0.024796009063720703, 0.0255889892578125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 6.0, 5.0, 8.0, 8.0, 13.0, 20.0, 24.0, 39.0, 59.0, 84.0, 136.0, 235.0, 386.0, 632.0, 1273.0, 2630.0, 5976.0, 17067.0, 74445.0, 731695.0, 3115389.0, 192928.0, 33318.0, 9805.0, 3928.0, 1871.0, 934.0, 530.0, 291.0, 176.0, 123.0, 70.0, 60.0, 32.0, 26.0, 24.0, 10.0, 8.0, 7.0, 6.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0158233642578125, -0.015242576599121094, -0.014661788940429688, -0.014081001281738281, -0.013500213623046875, -0.012919425964355469, -0.012338638305664062, -0.011757850646972656, -0.01117706298828125, -0.010596275329589844, -0.010015487670898438, -0.009434700012207031, -0.008853912353515625, -0.008273124694824219, -0.0076923370361328125, -0.007111549377441406, -0.00653076171875, -0.005949974060058594, -0.0053691864013671875, -0.004788398742675781, -0.004207611083984375, -0.0036268234252929688, -0.0030460357666015625, -0.0024652481079101562, -0.00188446044921875, -0.0013036727905273438, -0.0007228851318359375, -0.00014209747314453125, 0.000438690185546875, 0.0010194778442382812, 0.0016002655029296875, 0.0021810531616210938, 0.0027618408203125, 0.0033426284790039062, 0.0039234161376953125, 0.004504203796386719, 0.005084991455078125, 0.005665779113769531, 0.0062465667724609375, 0.006827354431152344, 0.00740814208984375, 0.007988929748535156, 0.008569717407226562, 0.009150505065917969, 0.009731292724609375, 0.010312080383300781, 0.010892868041992188, 0.011473655700683594, 0.012054443359375, 0.012635231018066406, 0.013216018676757812, 0.013796806335449219, 0.014377593994140625, 0.014958381652832031, 0.015539169311523438, 0.016119956970214844, 0.01670074462890625, 0.017281532287597656, 0.017862319946289062, 0.01844310760498047, 0.019023895263671875, 0.01960468292236328, 0.020185470581054688, 0.020766258239746094, 0.0213470458984375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 7.0, 12.0, 5.0, 17.0, 22.0, 31.0, 73.0, 113.0, 207.0, 446.0, 1080.0, 1053.0, 475.0, 199.0, 121.0, 78.0, 53.0, 26.0, 17.0, 8.0, 9.0, 4.0, 5.0, 2.0, 3.0, 4.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0252227783203125, -0.024522066116333008, -0.023821353912353516, -0.023120641708374023, -0.02241992950439453, -0.02171921730041504, -0.021018505096435547, -0.020317792892456055, -0.019617080688476562, -0.01891636848449707, -0.018215656280517578, -0.017514944076538086, -0.016814231872558594, -0.0161135196685791, -0.01541280746459961, -0.014712095260620117, -0.014011383056640625, -0.013310670852661133, -0.01260995864868164, -0.011909246444702148, -0.011208534240722656, -0.010507822036743164, -0.009807109832763672, -0.00910639762878418, -0.008405685424804688, -0.007704973220825195, -0.007004261016845703, -0.006303548812866211, -0.005602836608886719, -0.0049021244049072266, -0.004201412200927734, -0.003500699996948242, -0.00279998779296875, -0.002099275588989258, -0.0013985633850097656, -0.0006978511810302734, 2.86102294921875e-06, 0.0007035732269287109, 0.0014042854309082031, 0.0021049976348876953, 0.0028057098388671875, 0.0035064220428466797, 0.004207134246826172, 0.004907846450805664, 0.005608558654785156, 0.0063092708587646484, 0.007009983062744141, 0.007710695266723633, 0.008411407470703125, 0.009112119674682617, 0.00981283187866211, 0.010513544082641602, 0.011214256286621094, 0.011914968490600586, 0.012615680694580078, 0.01331639289855957, 0.014017105102539062, 0.014717817306518555, 0.015418529510498047, 0.01611924171447754, 0.01681995391845703, 0.017520666122436523, 0.018221378326416016, 0.018922090530395508, 0.019622802734375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 8.0, 26.0, 71.0, 191.0, 298.0, 266.0, 94.0, 31.0, 11.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2374257594347, -0.23108816146850586, -0.2247505784034729, -0.21841298043727875, -0.2120753824710846, -0.20573779940605164, -0.19940020143985748, -0.19306260347366333, -0.18672500550746918, -0.18038740754127502, -0.17404982447624207, -0.1677122265100479, -0.16137462854385376, -0.1550370454788208, -0.14869944751262665, -0.1423618495464325, -0.13602426648139954, -0.12968666851520538, -0.12334907799959183, -0.11701148748397827, -0.11067388951778412, -0.10433629900217056, -0.097998708486557, -0.09166111052036285, -0.0853235125541687, -0.07898592203855515, -0.07264832407236099, -0.06631073355674744, -0.059973135590553284, -0.05363554507493973, -0.04729795083403587, -0.04096035659313202, -0.034622758626937866, -0.028285164386034012, -0.021947570145130157, -0.015609977766871452, -0.009272383525967598, -0.002934791147708893, 0.0034028030931949615, 0.009740397334098816, 0.01607799157500267, 0.022415585815906525, 0.02875318005681038, 0.03509077429771423, 0.04142836481332779, 0.047765959054231644, 0.0541035532951355, 0.06044114753603935, 0.0667787417769432, 0.07311633229255676, 0.07945393025875092, 0.08579152077436447, 0.09212911874055862, 0.09846670925617218, 0.10480430722236633, 0.11114189773797989, 0.11747948825359344, 0.123817078769207, 0.13015466928482056, 0.1364922672510147, 0.14282986521720886, 0.14916744828224182, 0.15550504624843597, 0.16184264421463013, 0.16818024218082428]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 2.0, 5.0, 6.0, 6.0, 20.0, 10.0, 11.0, 26.0, 33.0, 19.0, 31.0, 42.0, 45.0, 45.0, 44.0, 52.0, 43.0, 58.0, 60.0, 58.0, 56.0, 54.0, 44.0, 39.0, 33.0, 28.0, 34.0, 23.0, 20.0, 10.0, 9.0, 7.0, 10.0, 13.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.06550824642181396, -0.06372520327568054, -0.06194215267896652, -0.0601591058075428, -0.05837605893611908, -0.05659301206469536, -0.05480996519327164, -0.053026918321847916, -0.051243871450424194, -0.04946082457900047, -0.04767777770757675, -0.04589473083615303, -0.04411168396472931, -0.04232863709330559, -0.040545590221881866, -0.038762543350458145, -0.036979496479034424, -0.0351964496076107, -0.03341340273618698, -0.03163035586476326, -0.02984730899333954, -0.028064262121915817, -0.026281215250492096, -0.024498168379068375, -0.022715121507644653, -0.020932074636220932, -0.01914902776479721, -0.01736598089337349, -0.015582934021949768, -0.013799887150526047, -0.012016840279102325, -0.010233793407678604, -0.008450746536254883, -0.0066676996648311615, -0.00488465279340744, -0.003101605921983719, -0.0013185590505599976, 0.00046448782086372375, 0.002247534692287445, 0.004030581563711166, 0.005813628435134888, 0.007596675306558609, 0.00937972217798233, 0.011162769049406052, 0.012945815920829773, 0.014728862792253494, 0.016511909663677216, 0.018294956535100937, 0.020078003406524658, 0.02186105027794838, 0.0236440971493721, 0.025427144020795822, 0.027210190892219543, 0.028993237763643265, 0.030776284635066986, 0.03255933150649071, 0.03434237837791443, 0.03612542524933815, 0.03790847212076187, 0.03969151899218559, 0.041474565863609314, 0.043257612735033035, 0.04504065960645676, 0.04682370647788048, 0.0486067533493042]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 1.0, 5.0, 7.0, 10.0, 12.0, 9.0, 14.0, 27.0, 43.0, 45.0, 66.0, 103.0, 116.0, 146.0, 266.0, 405.0, 829.0, 1924.0, 6555.0, 40570.0, 690160.0, 280306.0, 19581.0, 4239.0, 1333.0, 672.0, 352.0, 205.0, 149.0, 112.0, 44.0, 52.0, 41.0, 32.0, 26.0, 22.0, 16.0, 13.0, 9.0, 10.0, 1.0, 2.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0435791015625, -0.04201316833496094, -0.040447235107421875, -0.03888130187988281, -0.03731536865234375, -0.03574943542480469, -0.034183502197265625, -0.03261756896972656, -0.0310516357421875, -0.029485702514648438, -0.027919769287109375, -0.026353836059570312, -0.02478790283203125, -0.023221969604492188, -0.021656036376953125, -0.020090103149414062, -0.018524169921875, -0.016958236694335938, -0.015392303466796875, -0.013826370239257812, -0.01226043701171875, -0.010694503784179688, -0.009128570556640625, -0.0075626373291015625, -0.0059967041015625, -0.0044307708740234375, -0.002864837646484375, -0.0012989044189453125, 0.00026702880859375, 0.0018329620361328125, 0.003398895263671875, 0.0049648284912109375, 0.00653076171875, 0.008096694946289062, 0.009662628173828125, 0.011228561401367188, 0.01279449462890625, 0.014360427856445312, 0.015926361083984375, 0.017492294311523438, 0.0190582275390625, 0.020624160766601562, 0.022190093994140625, 0.023756027221679688, 0.02532196044921875, 0.026887893676757812, 0.028453826904296875, 0.030019760131835938, 0.031585693359375, 0.03315162658691406, 0.034717559814453125, 0.03628349304199219, 0.03784942626953125, 0.03941535949707031, 0.040981292724609375, 0.04254722595214844, 0.0441131591796875, 0.04567909240722656, 0.047245025634765625, 0.04881095886230469, 0.05037689208984375, 0.05194282531738281, 0.053508758544921875, 0.05507469177246094, 0.056640625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 21.0, 55.0, 101.0, 183.0, 194.0, 152.0, 150.0, 77.0, 48.0, 11.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0247650146484375, -0.02398514747619629, -0.023205280303955078, -0.022425413131713867, -0.021645545959472656, -0.020865678787231445, -0.020085811614990234, -0.019305944442749023, -0.018526077270507812, -0.0177462100982666, -0.01696634292602539, -0.01618647575378418, -0.015406608581542969, -0.014626741409301758, -0.013846874237060547, -0.013067007064819336, -0.012287139892578125, -0.011507272720336914, -0.010727405548095703, -0.009947538375854492, -0.009167671203613281, -0.00838780403137207, -0.007607936859130859, -0.0068280696868896484, -0.0060482025146484375, -0.0052683353424072266, -0.004488468170166016, -0.0037086009979248047, -0.0029287338256835938, -0.002148866653442383, -0.0013689994812011719, -0.0005891323089599609, 0.00019073486328125, 0.0009706020355224609, 0.0017504692077636719, 0.002530336380004883, 0.0033102035522460938, 0.004090070724487305, 0.004869937896728516, 0.0056498050689697266, 0.0064296722412109375, 0.0072095394134521484, 0.00798940658569336, 0.00876927375793457, 0.009549140930175781, 0.010329008102416992, 0.011108875274658203, 0.011888742446899414, 0.012668609619140625, 0.013448476791381836, 0.014228343963623047, 0.015008211135864258, 0.01578807830810547, 0.01656794548034668, 0.01734781265258789, 0.0181276798248291, 0.018907546997070312, 0.019687414169311523, 0.020467281341552734, 0.021247148513793945, 0.022027015686035156, 0.022806882858276367, 0.023586750030517578, 0.02436661720275879, 0.025146484375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 3.0, 4.0, 3.0, 9.0, 12.0, 14.0, 25.0, 30.0, 64.0, 102.0, 156.0, 250.0, 397.0, 765.0, 1470.0, 3045.0, 6827.0, 17946.0, 56450.0, 258351.0, 517676.0, 130451.0, 32823.0, 11868.0, 4847.0, 2249.0, 1212.0, 604.0, 332.0, 189.0, 126.0, 96.0, 61.0, 26.0, 24.0, 11.0, 8.0, 10.0, 7.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.026275634765625, -0.025509357452392578, -0.024743080139160156, -0.023976802825927734, -0.023210525512695312, -0.02244424819946289, -0.02167797088623047, -0.020911693572998047, -0.020145416259765625, -0.019379138946533203, -0.01861286163330078, -0.01784658432006836, -0.017080307006835938, -0.016314029693603516, -0.015547752380371094, -0.014781475067138672, -0.01401519775390625, -0.013248920440673828, -0.012482643127441406, -0.011716365814208984, -0.010950088500976562, -0.01018381118774414, -0.009417533874511719, -0.008651256561279297, -0.007884979248046875, -0.007118701934814453, -0.006352424621582031, -0.005586147308349609, -0.0048198699951171875, -0.004053592681884766, -0.0032873153686523438, -0.002521038055419922, -0.0017547607421875, -0.0009884834289550781, -0.00022220611572265625, 0.0005440711975097656, 0.0013103485107421875, 0.0020766258239746094, 0.0028429031372070312, 0.003609180450439453, 0.004375457763671875, 0.005141735076904297, 0.005908012390136719, 0.006674289703369141, 0.0074405670166015625, 0.008206844329833984, 0.008973121643066406, 0.009739398956298828, 0.01050567626953125, 0.011271953582763672, 0.012038230895996094, 0.012804508209228516, 0.013570785522460938, 0.01433706283569336, 0.015103340148925781, 0.015869617462158203, 0.016635894775390625, 0.017402172088623047, 0.01816844940185547, 0.01893472671508789, 0.019701004028320312, 0.020467281341552734, 0.021233558654785156, 0.021999835968017578, 0.02276611328125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 4.0, 1.0, 3.0, 3.0, 10.0, 9.0, 16.0, 16.0, 17.0, 25.0, 33.0, 38.0, 53.0, 79.0, 68.0, 62.0, 75.0, 70.0, 48.0, 60.0, 48.0, 53.0, 43.0, 33.0, 26.0, 34.0, 9.0, 22.0, 12.0, 13.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02227783203125, -0.021418094635009766, -0.02055835723876953, -0.019698619842529297, -0.018838882446289062, -0.017979145050048828, -0.017119407653808594, -0.01625967025756836, -0.015399932861328125, -0.01454019546508789, -0.013680458068847656, -0.012820720672607422, -0.011960983276367188, -0.011101245880126953, -0.010241508483886719, -0.009381771087646484, -0.00852203369140625, -0.007662296295166016, -0.006802558898925781, -0.005942821502685547, -0.0050830841064453125, -0.004223346710205078, -0.0033636093139648438, -0.0025038719177246094, -0.001644134521484375, -0.0007843971252441406, 7.534027099609375e-05, 0.0009350776672363281, 0.0017948150634765625, 0.002654552459716797, 0.0035142898559570312, 0.004374027252197266, 0.0052337646484375, 0.006093502044677734, 0.006953239440917969, 0.007812976837158203, 0.008672714233398438, 0.009532451629638672, 0.010392189025878906, 0.01125192642211914, 0.012111663818359375, 0.01297140121459961, 0.013831138610839844, 0.014690876007080078, 0.015550613403320312, 0.016410350799560547, 0.01727008819580078, 0.018129825592041016, 0.01898956298828125, 0.019849300384521484, 0.02070903778076172, 0.021568775177001953, 0.022428512573242188, 0.023288249969482422, 0.024147987365722656, 0.02500772476196289, 0.025867462158203125, 0.02672719955444336, 0.027586936950683594, 0.028446674346923828, 0.029306411743164062, 0.030166149139404297, 0.03102588653564453, 0.031885623931884766, 0.032745361328125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 5.0, 2.0, 6.0, 10.0, 10.0, 10.0, 12.0, 24.0, 27.0, 46.0, 52.0, 87.0, 117.0, 153.0, 239.0, 320.0, 547.0, 778.0, 1328.0, 2186.0, 4249.0, 9393.0, 29317.0, 241268.0, 671234.0, 59818.0, 14201.0, 5749.0, 2778.0, 1607.0, 970.0, 655.0, 412.0, 280.0, 199.0, 131.0, 91.0, 76.0, 40.0, 39.0, 23.0, 19.0, 15.0, 12.0, 8.0, 7.0, 6.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.017822265625, -0.017251253128051758, -0.016680240631103516, -0.016109228134155273, -0.015538215637207031, -0.014967203140258789, -0.014396190643310547, -0.013825178146362305, -0.013254165649414062, -0.01268315315246582, -0.012112140655517578, -0.011541128158569336, -0.010970115661621094, -0.010399103164672852, -0.00982809066772461, -0.009257078170776367, -0.008686065673828125, -0.008115053176879883, -0.007544040679931641, -0.0069730281829833984, -0.006402015686035156, -0.005831003189086914, -0.005259990692138672, -0.00468897819519043, -0.0041179656982421875, -0.0035469532012939453, -0.002975940704345703, -0.002404928207397461, -0.0018339157104492188, -0.0012629032135009766, -0.0006918907165527344, -0.00012087821960449219, 0.00045013427734375, 0.0010211467742919922, 0.0015921592712402344, 0.0021631717681884766, 0.0027341842651367188, 0.003305196762084961, 0.003876209259033203, 0.004447221755981445, 0.0050182342529296875, 0.00558924674987793, 0.006160259246826172, 0.006731271743774414, 0.007302284240722656, 0.007873296737670898, 0.00844430923461914, 0.009015321731567383, 0.009586334228515625, 0.010157346725463867, 0.01072835922241211, 0.011299371719360352, 0.011870384216308594, 0.012441396713256836, 0.013012409210205078, 0.01358342170715332, 0.014154434204101562, 0.014725446701049805, 0.015296459197998047, 0.01586747169494629, 0.01643848419189453, 0.017009496688842773, 0.017580509185791016, 0.018151521682739258, 0.0187225341796875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 6.0, 4.0, 8.0, 15.0, 23.0, 18.0, 32.0, 43.0, 69.0, 89.0, 108.0, 164.0, 117.0, 89.0, 63.0, 49.0, 22.0, 22.0, 13.0, 8.0, 6.0, 3.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.673833847045898e-05, -9.393226355314255e-05, -9.112618863582611e-05, -8.832011371850967e-05, -8.551403880119324e-05, -8.27079638838768e-05, -7.990188896656036e-05, -7.709581404924393e-05, -7.428973913192749e-05, -7.148366421461105e-05, -6.867758929729462e-05, -6.587151437997818e-05, -6.306543946266174e-05, -6.0259364545345306e-05, -5.745328962802887e-05, -5.464721471071243e-05, -5.1841139793395996e-05, -4.903506487607956e-05, -4.622898995876312e-05, -4.3422915041446686e-05, -4.061684012413025e-05, -3.781076520681381e-05, -3.5004690289497375e-05, -3.219861537218094e-05, -2.9392540454864502e-05, -2.6586465537548065e-05, -2.378039062023163e-05, -2.097431570291519e-05, -1.8168240785598755e-05, -1.5362165868282318e-05, -1.2556090950965881e-05, -9.750016033649445e-06, -6.943941116333008e-06, -4.137866199016571e-06, -1.3317912817001343e-06, 1.4742836356163025e-06, 4.280358552932739e-06, 7.086433470249176e-06, 9.892508387565613e-06, 1.269858330488205e-05, 1.5504658222198486e-05, 1.8310733139514923e-05, 2.111680805683136e-05, 2.3922882974147797e-05, 2.6728957891464233e-05, 2.953503280878067e-05, 3.234110772609711e-05, 3.5147182643413544e-05, 3.795325756072998e-05, 4.075933247804642e-05, 4.3565407395362854e-05, 4.637148231267929e-05, 4.917755722999573e-05, 5.1983632147312164e-05, 5.47897070646286e-05, 5.759578198194504e-05, 6.0401856899261475e-05, 6.320793181657791e-05, 6.601400673389435e-05, 6.882008165121078e-05, 7.162615656852722e-05, 7.443223148584366e-05, 7.72383064031601e-05, 8.004438132047653e-05, 8.285045623779297e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 8.0, 14.0, 10.0, 32.0, 31.0, 67.0, 99.0, 149.0, 319.0, 480.0, 967.0, 1747.0, 3287.0, 7466.0, 19941.0, 73627.0, 539350.0, 322669.0, 50768.0, 15253.0, 6158.0, 2761.0, 1441.0, 791.0, 446.0, 255.0, 136.0, 88.0, 51.0, 35.0, 22.0, 23.0, 10.0, 5.0, 7.0, 4.0, 3.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0135345458984375, -0.013109922409057617, -0.012685298919677734, -0.012260675430297852, -0.011836051940917969, -0.011411428451538086, -0.010986804962158203, -0.01056218147277832, -0.010137557983398438, -0.009712934494018555, -0.009288311004638672, -0.008863687515258789, -0.008439064025878906, -0.008014440536499023, -0.007589817047119141, -0.007165193557739258, -0.006740570068359375, -0.006315946578979492, -0.005891323089599609, -0.0054666996002197266, -0.005042076110839844, -0.004617452621459961, -0.004192829132080078, -0.0037682056427001953, -0.0033435821533203125, -0.0029189586639404297, -0.002494335174560547, -0.002069711685180664, -0.0016450881958007812, -0.0012204647064208984, -0.0007958412170410156, -0.0003712177276611328, 5.340576171875e-05, 0.0004780292510986328, 0.0009026527404785156, 0.0013272762298583984, 0.0017518997192382812, 0.002176523208618164, 0.002601146697998047, 0.0030257701873779297, 0.0034503936767578125, 0.0038750171661376953, 0.004299640655517578, 0.004724264144897461, 0.005148887634277344, 0.0055735111236572266, 0.005998134613037109, 0.006422758102416992, 0.006847381591796875, 0.007272005081176758, 0.007696628570556641, 0.008121252059936523, 0.008545875549316406, 0.008970499038696289, 0.009395122528076172, 0.009819746017456055, 0.010244369506835938, 0.01066899299621582, 0.011093616485595703, 0.011518239974975586, 0.011942863464355469, 0.012367486953735352, 0.012792110443115234, 0.013216733932495117, 0.013641357421875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 3.0, 6.0, 3.0, 4.0, 4.0, 7.0, 5.0, 17.0, 8.0, 22.0, 26.0, 50.0, 110.0, 254.0, 219.0, 110.0, 45.0, 22.0, 13.0, 11.0, 14.0, 10.0, 6.0, 3.0, 3.0, 7.0, 2.0, 4.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0184783935546875, -0.017933368682861328, -0.017388343811035156, -0.016843318939208984, -0.016298294067382812, -0.01575326919555664, -0.015208244323730469, -0.014663219451904297, -0.014118194580078125, -0.013573169708251953, -0.013028144836425781, -0.01248311996459961, -0.011938095092773438, -0.011393070220947266, -0.010848045349121094, -0.010303020477294922, -0.00975799560546875, -0.009212970733642578, -0.008667945861816406, -0.008122920989990234, -0.0075778961181640625, -0.007032871246337891, -0.006487846374511719, -0.005942821502685547, -0.005397796630859375, -0.004852771759033203, -0.004307746887207031, -0.0037627220153808594, -0.0032176971435546875, -0.0026726722717285156, -0.0021276473999023438, -0.0015826225280761719, -0.00103759765625, -0.0004925727844238281, 5.245208740234375e-05, 0.0005974769592285156, 0.0011425018310546875, 0.0016875267028808594, 0.0022325515747070312, 0.002777576446533203, 0.003322601318359375, 0.003867626190185547, 0.004412651062011719, 0.004957675933837891, 0.0055027008056640625, 0.006047725677490234, 0.006592750549316406, 0.007137775421142578, 0.00768280029296875, 0.008227825164794922, 0.008772850036621094, 0.009317874908447266, 0.009862899780273438, 0.01040792465209961, 0.010952949523925781, 0.011497974395751953, 0.012042999267578125, 0.012588024139404297, 0.013133049011230469, 0.01367807388305664, 0.014223098754882812, 0.014768123626708984, 0.015313148498535156, 0.015858173370361328, 0.0164031982421875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 7.0, 17.0, 50.0, 210.0, 386.0, 207.0, 82.0, 30.0, 8.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21220669150352478, -0.20177192986011505, -0.19133715331554413, -0.1809023916721344, -0.17046761512756348, -0.16003285348415375, -0.14959809184074402, -0.1391633152961731, -0.12872855365276337, -0.11829378455877304, -0.10785901546478271, -0.09742425382137299, -0.08698948472738266, -0.07655471563339233, -0.0661199539899826, -0.05568518489599228, -0.04525041580200195, -0.03481564670801163, -0.0243808813393116, -0.013946115970611572, -0.0035113468766212463, 0.00692342221736908, 0.01735818386077881, 0.027792952954769135, 0.03822772204875946, 0.048662491142749786, 0.059097256511449814, 0.06953202188014984, 0.07996679097414017, 0.0904015600681305, 0.10083632171154022, 0.11127109080553055, 0.12170583009719849, 0.13214059174060822, 0.14257536828517914, 0.15301012992858887, 0.1634449064731598, 0.17387966811656952, 0.18431442975997925, 0.19474920630455017, 0.2051839679479599, 0.21561872959136963, 0.22605350613594055, 0.23648826777935028, 0.24692302942276, 0.25735780596733093, 0.26779258251190186, 0.2782273292541504, 0.2886621057987213, 0.29909688234329224, 0.30953162908554077, 0.3199664056301117, 0.3304011821746826, 0.34083592891693115, 0.3512707054615021, 0.361705482006073, 0.37214022874832153, 0.38257500529289246, 0.393009752035141, 0.4034445285797119, 0.41387930512428284, 0.42431408166885376, 0.4347488284111023, 0.4451836049556732, 0.45561838150024414]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 6.0, 1.0, 7.0, 6.0, 14.0, 10.0, 11.0, 18.0, 25.0, 29.0, 31.0, 43.0, 58.0, 60.0, 54.0, 56.0, 55.0, 69.0, 57.0, 47.0, 41.0, 44.0, 54.0, 32.0, 32.0, 32.0, 19.0, 22.0, 21.0, 14.0, 12.0, 6.0, 6.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06769245862960815, -0.06512940675020218, -0.0625663548707962, -0.06000330671668053, -0.05744025483727455, -0.054877202957868576, -0.0523141548037529, -0.049751102924346924, -0.04718805104494095, -0.04462499916553497, -0.042061947286129, -0.03949889913201332, -0.036935847252607346, -0.03437279537320137, -0.03180974721908569, -0.029246695339679718, -0.026683643460273743, -0.024120591580867767, -0.02155754156410694, -0.018994491547346115, -0.01643143966794014, -0.013868388719856739, -0.011305337771773338, -0.008742287755012512, -0.006179235875606537, -0.003616184927523136, -0.0010531339794397354, 0.0015099169686436653, 0.004072967916727066, 0.006636018864810467, 0.009199069812893867, 0.011762119829654694, 0.014325171709060669, 0.016888223588466644, 0.01945127360522747, 0.022014323621988297, 0.024577375501394272, 0.027140427380800247, 0.029703477397561073, 0.0322665274143219, 0.034829579293727875, 0.03739263117313385, 0.039955683052539825, 0.0425187312066555, 0.04508178308606148, 0.04764483496546745, 0.05020788311958313, 0.052770934998989105, 0.05533398687839508, 0.057897038757801056, 0.06046009063720703, 0.063023142516613, 0.06558619439601898, 0.06814923882484436, 0.07071229070425034, 0.07327534258365631, 0.07583839446306229, 0.07840144634246826, 0.08096449822187424, 0.08352755010128021, 0.08609059453010559, 0.08865364640951157, 0.09121669828891754, 0.09377975016832352, 0.09634280204772949]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 4.0, 5.0, 7.0, 14.0, 26.0, 33.0, 52.0, 100.0, 196.0, 450.0, 1409.0, 7710.0, 107363.0, 3982209.0, 85616.0, 6861.0, 1405.0, 421.0, 186.0, 93.0, 48.0, 29.0, 19.0, 9.0, 8.0, 7.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044586181640625, -0.04312276840209961, -0.04165935516357422, -0.04019594192504883, -0.03873252868652344, -0.03726911544799805, -0.035805702209472656, -0.034342288970947266, -0.032878875732421875, -0.031415462493896484, -0.029952049255371094, -0.028488636016845703, -0.027025222778320312, -0.025561809539794922, -0.02409839630126953, -0.02263498306274414, -0.02117156982421875, -0.01970815658569336, -0.01824474334716797, -0.016781330108642578, -0.015317916870117188, -0.013854503631591797, -0.012391090393066406, -0.010927677154541016, -0.009464263916015625, -0.008000850677490234, -0.006537437438964844, -0.005074024200439453, -0.0036106109619140625, -0.002147197723388672, -0.0006837844848632812, 0.0007796287536621094, 0.0022430419921875, 0.0037064552307128906, 0.005169868469238281, 0.006633281707763672, 0.008096694946289062, 0.009560108184814453, 0.011023521423339844, 0.012486934661865234, 0.013950347900390625, 0.015413761138916016, 0.016877174377441406, 0.018340587615966797, 0.019804000854492188, 0.021267414093017578, 0.02273082733154297, 0.02419424057006836, 0.02565765380859375, 0.02712106704711914, 0.02858448028564453, 0.030047893524169922, 0.03151130676269531, 0.0329747200012207, 0.034438133239746094, 0.035901546478271484, 0.037364959716796875, 0.038828372955322266, 0.040291786193847656, 0.04175519943237305, 0.04321861267089844, 0.04468202590942383, 0.04614543914794922, 0.04760885238647461, 0.049072265625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 12.0, 33.0, 71.0, 119.0, 166.0, 177.0, 152.0, 132.0, 71.0, 40.0, 17.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.024810791015625, -0.024048566818237305, -0.02328634262084961, -0.022524118423461914, -0.02176189422607422, -0.020999670028686523, -0.020237445831298828, -0.019475221633911133, -0.018712997436523438, -0.017950773239135742, -0.017188549041748047, -0.01642632484436035, -0.015664100646972656, -0.014901876449584961, -0.014139652252197266, -0.01337742805480957, -0.012615203857421875, -0.01185297966003418, -0.011090755462646484, -0.010328531265258789, -0.009566307067871094, -0.008804082870483398, -0.008041858673095703, -0.007279634475708008, -0.0065174102783203125, -0.005755186080932617, -0.004992961883544922, -0.0042307376861572266, -0.0034685134887695312, -0.002706289291381836, -0.0019440650939941406, -0.0011818408966064453, -0.00041961669921875, 0.0003426074981689453, 0.0011048316955566406, 0.001867055892944336, 0.0026292800903320312, 0.0033915042877197266, 0.004153728485107422, 0.004915952682495117, 0.0056781768798828125, 0.006440401077270508, 0.007202625274658203, 0.007964849472045898, 0.008727073669433594, 0.009489297866821289, 0.010251522064208984, 0.01101374626159668, 0.011775970458984375, 0.01253819465637207, 0.013300418853759766, 0.014062643051147461, 0.014824867248535156, 0.015587091445922852, 0.016349315643310547, 0.017111539840698242, 0.017873764038085938, 0.018635988235473633, 0.019398212432861328, 0.020160436630249023, 0.02092266082763672, 0.021684885025024414, 0.02244710922241211, 0.023209333419799805, 0.0239715576171875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 10.0, 3.0, 11.0, 13.0, 19.0, 31.0, 57.0, 90.0, 149.0, 272.0, 501.0, 931.0, 2176.0, 5190.0, 16322.0, 79628.0, 1525268.0, 2436574.0, 97489.0, 18870.0, 5881.0, 2390.0, 1134.0, 552.0, 309.0, 165.0, 77.0, 60.0, 36.0, 14.0, 20.0, 15.0, 11.0, 4.0, 3.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.029022216796875, -0.028169870376586914, -0.027317523956298828, -0.026465177536010742, -0.025612831115722656, -0.02476048469543457, -0.023908138275146484, -0.0230557918548584, -0.022203445434570312, -0.021351099014282227, -0.02049875259399414, -0.019646406173706055, -0.01879405975341797, -0.017941713333129883, -0.017089366912841797, -0.01623702049255371, -0.015384674072265625, -0.014532327651977539, -0.013679981231689453, -0.012827634811401367, -0.011975288391113281, -0.011122941970825195, -0.01027059555053711, -0.009418249130249023, -0.008565902709960938, -0.0077135562896728516, -0.006861209869384766, -0.00600886344909668, -0.005156517028808594, -0.004304170608520508, -0.003451824188232422, -0.002599477767944336, -0.00174713134765625, -0.0008947849273681641, -4.2438507080078125e-05, 0.0008099079132080078, 0.0016622543334960938, 0.0025146007537841797, 0.0033669471740722656, 0.0042192935943603516, 0.0050716400146484375, 0.0059239864349365234, 0.006776332855224609, 0.007628679275512695, 0.008481025695800781, 0.009333372116088867, 0.010185718536376953, 0.011038064956665039, 0.011890411376953125, 0.012742757797241211, 0.013595104217529297, 0.014447450637817383, 0.015299797058105469, 0.016152143478393555, 0.01700448989868164, 0.017856836318969727, 0.018709182739257812, 0.0195615291595459, 0.020413875579833984, 0.02126622200012207, 0.022118568420410156, 0.022970914840698242, 0.023823261260986328, 0.024675607681274414, 0.0255279541015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 5.0, 2.0, 9.0, 12.0, 13.0, 18.0, 28.0, 52.0, 78.0, 105.0, 248.0, 480.0, 1193.0, 935.0, 356.0, 223.0, 113.0, 68.0, 45.0, 24.0, 17.0, 21.0, 5.0, 11.0, 2.0, 1.0, 1.0, 3.0, 4.0, 5.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0276641845703125, -0.02689075469970703, -0.026117324829101562, -0.025343894958496094, -0.024570465087890625, -0.023797035217285156, -0.023023605346679688, -0.02225017547607422, -0.02147674560546875, -0.02070331573486328, -0.019929885864257812, -0.019156455993652344, -0.018383026123046875, -0.017609596252441406, -0.016836166381835938, -0.01606273651123047, -0.015289306640625, -0.014515876770019531, -0.013742446899414062, -0.012969017028808594, -0.012195587158203125, -0.011422157287597656, -0.010648727416992188, -0.009875297546386719, -0.00910186767578125, -0.008328437805175781, -0.0075550079345703125, -0.006781578063964844, -0.006008148193359375, -0.005234718322753906, -0.0044612884521484375, -0.0036878585815429688, -0.0029144287109375, -0.0021409988403320312, -0.0013675689697265625, -0.0005941390991210938, 0.000179290771484375, 0.0009527206420898438, 0.0017261505126953125, 0.0024995803833007812, 0.00327301025390625, 0.004046440124511719, 0.0048198699951171875, 0.005593299865722656, 0.006366729736328125, 0.007140159606933594, 0.007913589477539062, 0.008687019348144531, 0.00946044921875, 0.010233879089355469, 0.011007308959960938, 0.011780738830566406, 0.012554168701171875, 0.013327598571777344, 0.014101028442382812, 0.014874458312988281, 0.01564788818359375, 0.01642131805419922, 0.017194747924804688, 0.017968177795410156, 0.018741607666015625, 0.019515037536621094, 0.020288467407226562, 0.02106189727783203, 0.0218353271484375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 6.0, 10.0, 29.0, 39.0, 128.0, 247.0, 291.0, 145.0, 51.0, 38.0, 8.0, 4.0, 2.0, 0.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.32973966002464294, -0.32270506024360657, -0.3156704902648926, -0.3086358904838562, -0.3016012907028198, -0.29456669092178345, -0.28753212094306946, -0.2804975211620331, -0.2734629213809967, -0.2664283215999603, -0.25939375162124634, -0.25235915184020996, -0.24532455205917358, -0.2382899671792984, -0.23125536739826202, -0.22422078251838684, -0.21718618273735046, -0.21015159785747528, -0.2031169980764389, -0.19608241319656372, -0.18904781341552734, -0.18201322853565216, -0.17497862875461578, -0.1679440438747406, -0.16090945899486542, -0.15387487411499023, -0.14684027433395386, -0.13980568945407867, -0.1327710896730423, -0.12573650479316711, -0.11870190501213074, -0.11166732013225555, -0.10463272035121918, -0.0975981280207634, -0.09056353569030762, -0.08352894335985184, -0.07649435102939606, -0.06945976614952087, -0.062425170093774796, -0.055390577763319016, -0.048355985432863235, -0.041321393102407455, -0.034286800771951675, -0.027252210304141045, -0.020217617973685265, -0.013183027505874634, -0.006148435175418854, 0.0008861571550369263, 0.007920749485492706, 0.014955341815948486, 0.021989934146404266, 0.029024524614214897, 0.036059118807315826, 0.04309370741248131, 0.05012829974293709, 0.05716289207339287, 0.06419748067855835, 0.07123207300901413, 0.07826666533946991, 0.08530125766992569, 0.09233585000038147, 0.09937043488025665, 0.10640503466129303, 0.11343961954116821, 0.12047421932220459]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 3.0, 10.0, 12.0, 12.0, 17.0, 28.0, 20.0, 28.0, 31.0, 43.0, 39.0, 40.0, 45.0, 58.0, 54.0, 66.0, 54.0, 60.0, 60.0, 53.0, 45.0, 45.0, 31.0, 27.0, 20.0, 27.0, 16.0, 14.0, 10.0, 8.0, 9.0, 4.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08672666549682617, -0.0843854695558548, -0.08204426616430283, -0.07970306277275085, -0.07736186683177948, -0.0750206708908081, -0.07267946749925613, -0.07033826410770416, -0.06799706816673279, -0.06565587222576141, -0.06331466883420944, -0.06097346916794777, -0.058632269501686096, -0.05629106983542442, -0.05394987016916275, -0.05160867050290108, -0.049267470836639404, -0.04692627117037773, -0.04458507150411606, -0.042243871837854385, -0.03990267217159271, -0.03756147250533104, -0.035220272839069366, -0.032879073172807693, -0.03053787350654602, -0.028196673840284348, -0.025855474174022675, -0.023514274507761, -0.02117307484149933, -0.018831875175237656, -0.016490675508975983, -0.01414947584271431, -0.011808276176452637, -0.009467076510190964, -0.007125876843929291, -0.004784677177667618, -0.002443477511405945, -0.00010227784514427185, 0.002238921821117401, 0.004580121487379074, 0.006921321153640747, 0.00926252081990242, 0.011603720486164093, 0.013944920152425766, 0.01628611981868744, 0.018627319484949112, 0.020968519151210785, 0.023309718817472458, 0.02565091848373413, 0.027992118149995804, 0.030333317816257477, 0.03267451748251915, 0.03501571714878082, 0.037356916815042496, 0.03969811648130417, 0.04203931614756584, 0.044380515813827515, 0.04672171548008919, 0.04906291514635086, 0.051404114812612534, 0.05374531447887421, 0.05608651414513588, 0.05842771381139755, 0.060768913477659225, 0.0631101131439209]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 2.0, 3.0, 8.0, 6.0, 6.0, 6.0, 11.0, 12.0, 25.0, 23.0, 40.0, 74.0, 92.0, 133.0, 218.0, 307.0, 532.0, 931.0, 2234.0, 8955.0, 82462.0, 738644.0, 192081.0, 15697.0, 3180.0, 1217.0, 547.0, 375.0, 232.0, 132.0, 110.0, 67.0, 52.0, 37.0, 30.0, 24.0, 15.0, 7.0, 5.0, 7.0, 6.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0574951171875, -0.055619239807128906, -0.05374336242675781, -0.05186748504638672, -0.049991607666015625, -0.04811573028564453, -0.04623985290527344, -0.044363975524902344, -0.04248809814453125, -0.040612220764160156, -0.03873634338378906, -0.03686046600341797, -0.034984588623046875, -0.03310871124267578, -0.031232833862304688, -0.029356956481933594, -0.0274810791015625, -0.025605201721191406, -0.023729324340820312, -0.02185344696044922, -0.019977569580078125, -0.01810169219970703, -0.016225814819335938, -0.014349937438964844, -0.01247406005859375, -0.010598182678222656, -0.008722305297851562, -0.006846427917480469, -0.004970550537109375, -0.0030946731567382812, -0.0012187957763671875, 0.0006570816040039062, 0.002532958984375, 0.004408836364746094, 0.0062847137451171875, 0.008160591125488281, 0.010036468505859375, 0.011912345886230469, 0.013788223266601562, 0.015664100646972656, 0.01753997802734375, 0.019415855407714844, 0.021291732788085938, 0.02316761016845703, 0.025043487548828125, 0.02691936492919922, 0.028795242309570312, 0.030671119689941406, 0.0325469970703125, 0.034422874450683594, 0.03629875183105469, 0.03817462921142578, 0.040050506591796875, 0.04192638397216797, 0.04380226135253906, 0.045678138732910156, 0.04755401611328125, 0.049429893493652344, 0.05130577087402344, 0.05318164825439453, 0.055057525634765625, 0.05693340301513672, 0.05880928039550781, 0.060685157775878906, 0.06256103515625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 39.0, 82.0, 120.0, 166.0, 166.0, 144.0, 123.0, 73.0, 50.0, 16.0, 5.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.027191162109375, -0.026380300521850586, -0.025569438934326172, -0.024758577346801758, -0.023947715759277344, -0.02313685417175293, -0.022325992584228516, -0.0215151309967041, -0.020704269409179688, -0.019893407821655273, -0.01908254623413086, -0.018271684646606445, -0.01746082305908203, -0.016649961471557617, -0.015839099884033203, -0.015028238296508789, -0.014217376708984375, -0.013406515121459961, -0.012595653533935547, -0.011784791946411133, -0.010973930358886719, -0.010163068771362305, -0.00935220718383789, -0.008541345596313477, -0.0077304840087890625, -0.0069196224212646484, -0.006108760833740234, -0.00529789924621582, -0.004487037658691406, -0.003676176071166992, -0.002865314483642578, -0.002054452896118164, -0.00124359130859375, -0.00043272972106933594, 0.0003781318664550781, 0.0011889934539794922, 0.0019998550415039062, 0.0028107166290283203, 0.0036215782165527344, 0.0044324398040771484, 0.0052433013916015625, 0.0060541629791259766, 0.006865024566650391, 0.007675886154174805, 0.008486747741699219, 0.009297609329223633, 0.010108470916748047, 0.010919332504272461, 0.011730194091796875, 0.012541055679321289, 0.013351917266845703, 0.014162778854370117, 0.014973640441894531, 0.015784502029418945, 0.01659536361694336, 0.017406225204467773, 0.018217086791992188, 0.0190279483795166, 0.019838809967041016, 0.02064967155456543, 0.021460533142089844, 0.022271394729614258, 0.023082256317138672, 0.023893117904663086, 0.0247039794921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 4.0, 3.0, 5.0, 10.0, 16.0, 10.0, 14.0, 25.0, 45.0, 52.0, 114.0, 179.0, 289.0, 484.0, 851.0, 1601.0, 3116.0, 6278.0, 13697.0, 33161.0, 88003.0, 235090.0, 357649.0, 189396.0, 69216.0, 26810.0, 11445.0, 5144.0, 2631.0, 1327.0, 764.0, 424.0, 285.0, 172.0, 89.0, 57.0, 28.0, 27.0, 12.0, 10.0, 7.0, 9.0, 4.0, 8.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.022674560546875, -0.02199530601501465, -0.021316051483154297, -0.020636796951293945, -0.019957542419433594, -0.019278287887573242, -0.01859903335571289, -0.01791977882385254, -0.017240524291992188, -0.016561269760131836, -0.015882015228271484, -0.015202760696411133, -0.014523506164550781, -0.01384425163269043, -0.013164997100830078, -0.012485742568969727, -0.011806488037109375, -0.011127233505249023, -0.010447978973388672, -0.00976872444152832, -0.009089469909667969, -0.008410215377807617, -0.007730960845947266, -0.007051706314086914, -0.0063724517822265625, -0.005693197250366211, -0.005013942718505859, -0.004334688186645508, -0.0036554336547851562, -0.0029761791229248047, -0.002296924591064453, -0.0016176700592041016, -0.00093841552734375, -0.00025916099548339844, 0.0004200935363769531, 0.0010993480682373047, 0.0017786026000976562, 0.002457857131958008, 0.0031371116638183594, 0.003816366195678711, 0.0044956207275390625, 0.005174875259399414, 0.005854129791259766, 0.006533384323120117, 0.007212638854980469, 0.00789189338684082, 0.008571147918701172, 0.009250402450561523, 0.009929656982421875, 0.010608911514282227, 0.011288166046142578, 0.01196742057800293, 0.012646675109863281, 0.013325929641723633, 0.014005184173583984, 0.014684438705444336, 0.015363693237304688, 0.01604294776916504, 0.01672220230102539, 0.017401456832885742, 0.018080711364746094, 0.018759965896606445, 0.019439220428466797, 0.02011847496032715, 0.0207977294921875]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 6.0, 9.0, 3.0, 8.0, 15.0, 7.0, 12.0, 18.0, 25.0, 33.0, 30.0, 29.0, 31.0, 38.0, 59.0, 49.0, 54.0, 43.0, 56.0, 53.0, 40.0, 45.0, 55.0, 30.0, 39.0, 29.0, 30.0, 30.0, 24.0, 24.0, 19.0, 19.0, 10.0, 9.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0234375, -0.02261519432067871, -0.021792888641357422, -0.020970582962036133, -0.020148277282714844, -0.019325971603393555, -0.018503665924072266, -0.017681360244750977, -0.016859054565429688, -0.0160367488861084, -0.01521444320678711, -0.01439213752746582, -0.013569831848144531, -0.012747526168823242, -0.011925220489501953, -0.011102914810180664, -0.010280609130859375, -0.009458303451538086, -0.008635997772216797, -0.007813692092895508, -0.006991386413574219, -0.00616908073425293, -0.005346775054931641, -0.0045244693756103516, -0.0037021636962890625, -0.0028798580169677734, -0.0020575523376464844, -0.0012352466583251953, -0.00041294097900390625, 0.0004093647003173828, 0.0012316703796386719, 0.002053976058959961, 0.00287628173828125, 0.003698587417602539, 0.004520893096923828, 0.005343198776245117, 0.006165504455566406, 0.006987810134887695, 0.007810115814208984, 0.008632421493530273, 0.009454727172851562, 0.010277032852172852, 0.01109933853149414, 0.01192164421081543, 0.012743949890136719, 0.013566255569458008, 0.014388561248779297, 0.015210866928100586, 0.016033172607421875, 0.016855478286743164, 0.017677783966064453, 0.018500089645385742, 0.01932239532470703, 0.02014470100402832, 0.02096700668334961, 0.0217893123626709, 0.022611618041992188, 0.023433923721313477, 0.024256229400634766, 0.025078535079956055, 0.025900840759277344, 0.026723146438598633, 0.027545452117919922, 0.02836775779724121, 0.0291900634765625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 6.0, 9.0, 14.0, 24.0, 31.0, 57.0, 68.0, 89.0, 117.0, 209.0, 339.0, 513.0, 755.0, 1249.0, 1898.0, 3327.0, 5894.0, 10966.0, 22319.0, 50442.0, 133286.0, 357922.0, 283258.0, 97592.0, 38851.0, 17867.0, 8845.0, 4963.0, 2866.0, 1736.0, 1047.0, 667.0, 456.0, 273.0, 208.0, 131.0, 73.0, 59.0, 38.0, 25.0, 19.0, 16.0, 6.0, 11.0, 4.0, 6.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.00896453857421875, -0.008683085441589355, -0.008401632308959961, -0.008120179176330566, -0.007838726043701172, -0.007557272911071777, -0.007275819778442383, -0.006994366645812988, -0.006712913513183594, -0.006431460380554199, -0.006150007247924805, -0.00586855411529541, -0.005587100982666016, -0.005305647850036621, -0.0050241947174072266, -0.004742741584777832, -0.0044612884521484375, -0.004179835319519043, -0.0038983821868896484, -0.003616929054260254, -0.0033354759216308594, -0.003054022789001465, -0.0027725696563720703, -0.0024911165237426758, -0.0022096633911132812, -0.0019282102584838867, -0.0016467571258544922, -0.0013653039932250977, -0.0010838508605957031, -0.0008023977279663086, -0.0005209445953369141, -0.00023949146270751953, 4.1961669921875e-05, 0.00032341480255126953, 0.0006048679351806641, 0.0008863210678100586, 0.0011677742004394531, 0.0014492273330688477, 0.0017306804656982422, 0.0020121335983276367, 0.0022935867309570312, 0.0025750398635864258, 0.0028564929962158203, 0.003137946128845215, 0.0034193992614746094, 0.003700852394104004, 0.0039823055267333984, 0.004263758659362793, 0.0045452117919921875, 0.004826664924621582, 0.0051081180572509766, 0.005389571189880371, 0.005671024322509766, 0.00595247745513916, 0.006233930587768555, 0.006515383720397949, 0.006796836853027344, 0.007078289985656738, 0.007359743118286133, 0.007641196250915527, 0.007922649383544922, 0.008204102516174316, 0.008485555648803711, 0.008767008781433105, 0.0090484619140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 2.0, 8.0, 5.0, 5.0, 7.0, 11.0, 8.0, 15.0, 10.0, 38.0, 28.0, 41.0, 48.0, 62.0, 73.0, 90.0, 91.0, 88.0, 75.0, 52.0, 48.0, 42.0, 28.0, 27.0, 19.0, 17.0, 13.0, 10.0, 8.0, 6.0, 4.0, 7.0, 3.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.012222290039062e-05, -8.743628859519958e-05, -8.475035429000854e-05, -8.20644199848175e-05, -7.937848567962646e-05, -7.669255137443542e-05, -7.400661706924438e-05, -7.132068276405334e-05, -6.86347484588623e-05, -6.594881415367126e-05, -6.326287984848022e-05, -6.0576945543289185e-05, -5.7891011238098145e-05, -5.5205076932907104e-05, -5.2519142627716064e-05, -4.9833208322525024e-05, -4.7147274017333984e-05, -4.4461339712142944e-05, -4.1775405406951904e-05, -3.9089471101760864e-05, -3.6403536796569824e-05, -3.3717602491378784e-05, -3.1031668186187744e-05, -2.8345733880996704e-05, -2.5659799575805664e-05, -2.2973865270614624e-05, -2.0287930965423584e-05, -1.7601996660232544e-05, -1.4916062355041504e-05, -1.2230128049850464e-05, -9.544193744659424e-06, -6.858259439468384e-06, -4.172325134277344e-06, -1.4863908290863037e-06, 1.1995434761047363e-06, 3.885477781295776e-06, 6.571412086486816e-06, 9.257346391677856e-06, 1.1943280696868896e-05, 1.4629215002059937e-05, 1.7315149307250977e-05, 2.0001083612442017e-05, 2.2687017917633057e-05, 2.5372952222824097e-05, 2.8058886528015137e-05, 3.074482083320618e-05, 3.343075513839722e-05, 3.611668944358826e-05, 3.88026237487793e-05, 4.148855805397034e-05, 4.417449235916138e-05, 4.686042666435242e-05, 4.954636096954346e-05, 5.22322952747345e-05, 5.491822957992554e-05, 5.760416388511658e-05, 6.029009819030762e-05, 6.297603249549866e-05, 6.56619668006897e-05, 6.834790110588074e-05, 7.103383541107178e-05, 7.371976971626282e-05, 7.640570402145386e-05, 7.90916383266449e-05, 8.177757263183594e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 4.0, 4.0, 4.0, 9.0, 12.0, 21.0, 28.0, 36.0, 64.0, 104.0, 196.0, 342.0, 721.0, 1369.0, 2643.0, 5326.0, 11628.0, 28025.0, 77713.0, 261495.0, 432523.0, 144550.0, 47326.0, 18531.0, 8067.0, 3801.0, 1883.0, 920.0, 506.0, 268.0, 153.0, 94.0, 52.0, 42.0, 27.0, 19.0, 12.0, 8.0, 3.0, 9.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0], "bins": [-0.01181793212890625, -0.01147305965423584, -0.01112818717956543, -0.01078331470489502, -0.01043844223022461, -0.0100935697555542, -0.009748697280883789, -0.009403824806213379, -0.009058952331542969, -0.008714079856872559, -0.008369207382202148, -0.008024334907531738, -0.007679462432861328, -0.007334589958190918, -0.006989717483520508, -0.006644845008850098, -0.0062999725341796875, -0.005955100059509277, -0.005610227584838867, -0.005265355110168457, -0.004920482635498047, -0.004575610160827637, -0.0042307376861572266, -0.0038858652114868164, -0.0035409927368164062, -0.003196120262145996, -0.002851247787475586, -0.0025063753128051758, -0.0021615028381347656, -0.0018166303634643555, -0.0014717578887939453, -0.0011268854141235352, -0.000782012939453125, -0.00043714046478271484, -9.226799011230469e-05, 0.00025260448455810547, 0.0005974769592285156, 0.0009423494338989258, 0.001287221908569336, 0.001632094383239746, 0.0019769668579101562, 0.0023218393325805664, 0.0026667118072509766, 0.0030115842819213867, 0.003356456756591797, 0.003701329231262207, 0.004046201705932617, 0.004391074180603027, 0.0047359466552734375, 0.005080819129943848, 0.005425691604614258, 0.005770564079284668, 0.006115436553955078, 0.006460309028625488, 0.0068051815032958984, 0.007150053977966309, 0.007494926452636719, 0.007839798927307129, 0.008184671401977539, 0.00852954387664795, 0.00887441635131836, 0.00921928882598877, 0.00956416130065918, 0.00990903377532959, 0.01025390625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 2.0, 8.0, 7.0, 6.0, 7.0, 11.0, 11.0, 20.0, 21.0, 20.0, 44.0, 43.0, 48.0, 100.0, 110.0, 119.0, 98.0, 69.0, 72.0, 39.0, 39.0, 30.0, 15.0, 12.0, 15.0, 15.0, 6.0, 3.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0138092041015625, -0.013407349586486816, -0.013005495071411133, -0.01260364055633545, -0.012201786041259766, -0.011799931526184082, -0.011398077011108398, -0.010996222496032715, -0.010594367980957031, -0.010192513465881348, -0.009790658950805664, -0.00938880443572998, -0.008986949920654297, -0.008585095405578613, -0.00818324089050293, -0.007781386375427246, -0.0073795318603515625, -0.006977677345275879, -0.006575822830200195, -0.006173968315124512, -0.005772113800048828, -0.0053702592849731445, -0.004968404769897461, -0.004566550254821777, -0.004164695739746094, -0.00376284122467041, -0.0033609867095947266, -0.002959132194519043, -0.0025572776794433594, -0.0021554231643676758, -0.0017535686492919922, -0.0013517141342163086, -0.000949859619140625, -0.0005480051040649414, -0.0001461505889892578, 0.0002557039260864258, 0.0006575584411621094, 0.001059412956237793, 0.0014612674713134766, 0.0018631219863891602, 0.0022649765014648438, 0.0026668310165405273, 0.003068685531616211, 0.0034705400466918945, 0.003872394561767578, 0.004274249076843262, 0.004676103591918945, 0.005077958106994629, 0.0054798126220703125, 0.005881667137145996, 0.00628352165222168, 0.006685376167297363, 0.007087230682373047, 0.0074890851974487305, 0.007890939712524414, 0.008292794227600098, 0.008694648742675781, 0.009096503257751465, 0.009498357772827148, 0.009900212287902832, 0.010302066802978516, 0.0107039213180542, 0.011105775833129883, 0.011507630348205566, 0.01190948486328125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 3.0, 14.0, 16.0, 28.0, 45.0, 102.0, 126.0, 147.0, 164.0, 114.0, 96.0, 57.0, 37.0, 19.0, 9.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.24636536836624146, -0.24099762737751007, -0.23562990128993988, -0.2302621603012085, -0.2248944342136383, -0.21952669322490692, -0.21415895223617554, -0.20879122614860535, -0.20342348515987396, -0.19805574417114258, -0.1926880180835724, -0.187320277094841, -0.18195253610610962, -0.17658481001853943, -0.17121706902980804, -0.16584932804107666, -0.16048160195350647, -0.15511386096477509, -0.1497461348772049, -0.1443783938884735, -0.13901066780090332, -0.13364292681217194, -0.12827518582344055, -0.12290745228528976, -0.11753971874713898, -0.11217198520898819, -0.1068042516708374, -0.10143651068210602, -0.09606877714395523, -0.09070104360580444, -0.08533330261707306, -0.07996556907892227, -0.07459785044193268, -0.06923011690378189, -0.0638623833656311, -0.05849464237689972, -0.05312690883874893, -0.047759175300598145, -0.04239143803715706, -0.03702370077371597, -0.031655967235565186, -0.02628823183476925, -0.020920496433973312, -0.015552761033177376, -0.01018502563238144, -0.004817290231585503, 0.000550445169210434, 0.00591818243265152, 0.011285915970802307, 0.016653651371598244, 0.02202138677239418, 0.027389122173190117, 0.03275685757398605, 0.03812459111213684, 0.04349232837557793, 0.04886006563901901, 0.0542277991771698, 0.05959553271532059, 0.06496326625347137, 0.07033100724220276, 0.07569874078035355, 0.08106647431850433, 0.08643421530723572, 0.0918019488453865, 0.09716968238353729]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 6.0, 11.0, 10.0, 8.0, 15.0, 8.0, 19.0, 17.0, 20.0, 18.0, 32.0, 28.0, 29.0, 34.0, 50.0, 43.0, 38.0, 39.0, 30.0, 41.0, 50.0, 44.0, 49.0, 43.0, 32.0, 36.0, 25.0, 36.0, 29.0, 22.0, 20.0, 30.0, 30.0, 9.0, 9.0, 11.0, 8.0, 9.0, 2.0, 6.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06681299209594727, -0.06453660130500793, -0.062260210514068604, -0.05998382344841957, -0.05770743265748024, -0.05543104186654091, -0.053154654800891876, -0.050878264009952545, -0.048601873219013214, -0.04632548242807388, -0.04404909163713455, -0.04177270457148552, -0.03949631378054619, -0.03721992298960686, -0.034943535923957825, -0.032667145133018494, -0.030390754342079163, -0.02811436355113983, -0.02583797462284565, -0.023561585694551468, -0.021285194903612137, -0.019008804112672806, -0.016732415184378624, -0.014456026256084442, -0.012179635465145111, -0.009903245605528355, -0.007626855745911598, -0.005350465886294842, -0.0030740760266780853, -0.0007976861670613289, 0.0014787036925554276, 0.0037550926208496094, 0.00603148341178894, 0.008307873271405697, 0.010584263131022453, 0.01286065299063921, 0.015137042850255966, 0.017413433641195297, 0.01968982256948948, 0.02196621149778366, 0.024242602288722992, 0.026518993079662323, 0.028795382007956505, 0.031071770936250687, 0.03334816172719002, 0.03562455251812935, 0.03790093958377838, 0.04017733037471771, 0.04245372116565704, 0.044730111956596375, 0.047006502747535706, 0.04928288981318474, 0.05155928060412407, 0.0538356713950634, 0.05611205846071243, 0.058388449251651764, 0.060664840042591095, 0.06294123083353043, 0.06521762162446976, 0.06749401241540909, 0.06977039575576782, 0.07204678654670715, 0.07432317733764648, 0.07659956812858582, 0.07887595891952515]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 7.0, 4.0, 7.0, 24.0, 24.0, 38.0, 41.0, 78.0, 140.0, 178.0, 428.0, 1157.0, 4082.0, 14666.0, 96326.0, 3365343.0, 662207.0, 38033.0, 7763.0, 2273.0, 761.0, 300.0, 140.0, 97.0, 53.0, 30.0, 25.0, 16.0, 12.0, 12.0, 2.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029541015625, -0.028548717498779297, -0.027556419372558594, -0.02656412124633789, -0.025571823120117188, -0.024579524993896484, -0.02358722686767578, -0.022594928741455078, -0.021602630615234375, -0.020610332489013672, -0.01961803436279297, -0.018625736236572266, -0.017633438110351562, -0.01664113998413086, -0.015648841857910156, -0.014656543731689453, -0.01366424560546875, -0.012671947479248047, -0.011679649353027344, -0.01068735122680664, -0.009695053100585938, -0.008702754974365234, -0.007710456848144531, -0.006718158721923828, -0.005725860595703125, -0.004733562469482422, -0.0037412643432617188, -0.0027489662170410156, -0.0017566680908203125, -0.0007643699645996094, 0.00022792816162109375, 0.0012202262878417969, 0.0022125244140625, 0.003204822540283203, 0.004197120666503906, 0.005189418792724609, 0.0061817169189453125, 0.007174015045166016, 0.008166313171386719, 0.009158611297607422, 0.010150909423828125, 0.011143207550048828, 0.012135505676269531, 0.013127803802490234, 0.014120101928710938, 0.01511240005493164, 0.016104698181152344, 0.017096996307373047, 0.01808929443359375, 0.019081592559814453, 0.020073890686035156, 0.02106618881225586, 0.022058486938476562, 0.023050785064697266, 0.02404308319091797, 0.025035381317138672, 0.026027679443359375, 0.027019977569580078, 0.02801227569580078, 0.029004573822021484, 0.029996871948242188, 0.03098917007446289, 0.031981468200683594, 0.0329737663269043, 0.033966064453125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 8.0, 31.0, 61.0, 93.0, 138.0, 167.0, 172.0, 127.0, 91.0, 54.0, 40.0, 10.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0282745361328125, -0.027416467666625977, -0.026558399200439453, -0.02570033073425293, -0.024842262268066406, -0.023984193801879883, -0.02312612533569336, -0.022268056869506836, -0.021409988403320312, -0.02055191993713379, -0.019693851470947266, -0.018835783004760742, -0.01797771453857422, -0.017119646072387695, -0.016261577606201172, -0.015403509140014648, -0.014545440673828125, -0.013687372207641602, -0.012829303741455078, -0.011971235275268555, -0.011113166809082031, -0.010255098342895508, -0.009397029876708984, -0.008538961410522461, -0.0076808929443359375, -0.006822824478149414, -0.005964756011962891, -0.005106687545776367, -0.004248619079589844, -0.0033905506134033203, -0.002532482147216797, -0.0016744136810302734, -0.00081634521484375, 4.172325134277344e-05, 0.0008997917175292969, 0.0017578601837158203, 0.0026159286499023438, 0.003473997116088867, 0.004332065582275391, 0.005190134048461914, 0.0060482025146484375, 0.006906270980834961, 0.007764339447021484, 0.008622407913208008, 0.009480476379394531, 0.010338544845581055, 0.011196613311767578, 0.012054681777954102, 0.012912750244140625, 0.013770818710327148, 0.014628887176513672, 0.015486955642700195, 0.01634502410888672, 0.017203092575073242, 0.018061161041259766, 0.01891922950744629, 0.019777297973632812, 0.020635366439819336, 0.02149343490600586, 0.022351503372192383, 0.023209571838378906, 0.02406764030456543, 0.024925708770751953, 0.025783777236938477, 0.026641845703125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 2.0, 7.0, 7.0, 8.0, 11.0, 25.0, 45.0, 45.0, 75.0, 145.0, 209.0, 378.0, 636.0, 1246.0, 2442.0, 5443.0, 15545.0, 64130.0, 647123.0, 3251388.0, 160626.0, 28559.0, 8787.0, 3543.0, 1714.0, 903.0, 470.0, 273.0, 181.0, 100.0, 73.0, 45.0, 29.0, 24.0, 9.0, 8.0, 10.0, 5.0, 10.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.031280517578125, -0.030392885208129883, -0.029505252838134766, -0.02861762046813965, -0.02772998809814453, -0.026842355728149414, -0.025954723358154297, -0.02506709098815918, -0.024179458618164062, -0.023291826248168945, -0.022404193878173828, -0.02151656150817871, -0.020628929138183594, -0.019741296768188477, -0.01885366439819336, -0.017966032028198242, -0.017078399658203125, -0.016190767288208008, -0.01530313491821289, -0.014415502548217773, -0.013527870178222656, -0.012640237808227539, -0.011752605438232422, -0.010864973068237305, -0.009977340698242188, -0.00908970832824707, -0.008202075958251953, -0.007314443588256836, -0.006426811218261719, -0.0055391788482666016, -0.004651546478271484, -0.003763914108276367, -0.00287628173828125, -0.001988649368286133, -0.0011010169982910156, -0.00021338462829589844, 0.0006742477416992188, 0.001561880111694336, 0.002449512481689453, 0.0033371448516845703, 0.0042247772216796875, 0.005112409591674805, 0.006000041961669922, 0.006887674331665039, 0.007775306701660156, 0.008662939071655273, 0.00955057144165039, 0.010438203811645508, 0.011325836181640625, 0.012213468551635742, 0.01310110092163086, 0.013988733291625977, 0.014876365661621094, 0.01576399803161621, 0.016651630401611328, 0.017539262771606445, 0.018426895141601562, 0.01931452751159668, 0.020202159881591797, 0.021089792251586914, 0.02197742462158203, 0.02286505699157715, 0.023752689361572266, 0.024640321731567383, 0.0255279541015625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 3.0, 4.0, 2.0, 11.0, 17.0, 19.0, 36.0, 43.0, 66.0, 112.0, 240.0, 487.0, 1177.0, 960.0, 401.0, 175.0, 104.0, 67.0, 47.0, 29.0, 17.0, 18.0, 5.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0269927978515625, -0.026195526123046875, -0.02539825439453125, -0.024600982666015625, -0.0238037109375, -0.023006439208984375, -0.02220916748046875, -0.021411895751953125, -0.0206146240234375, -0.019817352294921875, -0.01902008056640625, -0.018222808837890625, -0.017425537109375, -0.016628265380859375, -0.01583099365234375, -0.015033721923828125, -0.0142364501953125, -0.013439178466796875, -0.01264190673828125, -0.011844635009765625, -0.01104736328125, -0.010250091552734375, -0.00945281982421875, -0.008655548095703125, -0.0078582763671875, -0.007061004638671875, -0.00626373291015625, -0.005466461181640625, -0.004669189453125, -0.003871917724609375, -0.00307464599609375, -0.002277374267578125, -0.0014801025390625, -0.000682830810546875, 0.00011444091796875, 0.000911712646484375, 0.001708984375, 0.002506256103515625, 0.00330352783203125, 0.004100799560546875, 0.0048980712890625, 0.005695343017578125, 0.00649261474609375, 0.007289886474609375, 0.008087158203125, 0.008884429931640625, 0.00968170166015625, 0.010478973388671875, 0.0112762451171875, 0.012073516845703125, 0.01287078857421875, 0.013668060302734375, 0.01446533203125, 0.015262603759765625, 0.01605987548828125, 0.016857147216796875, 0.0176544189453125, 0.018451690673828125, 0.01924896240234375, 0.020046234130859375, 0.020843505859375, 0.021640777587890625, 0.02243804931640625, 0.023235321044921875, 0.0240325927734375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 8.0, 17.0, 45.0, 134.0, 288.0, 299.0, 130.0, 43.0, 32.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3527269959449768, -0.34388798475265503, -0.33504897356033325, -0.3262099623680115, -0.3173709511756897, -0.3085319399833679, -0.29969292879104614, -0.29085391759872437, -0.2820149064064026, -0.2731758952140808, -0.26433688402175903, -0.25549787282943726, -0.24665886163711548, -0.2378198504447937, -0.22898082435131073, -0.22014181315898895, -0.21130278706550598, -0.2024637758731842, -0.19362476468086243, -0.18478575348854065, -0.17594674229621887, -0.1671077311038971, -0.15826870501041412, -0.14942969381809235, -0.14059068262577057, -0.1317516714334488, -0.12291266024112701, -0.11407364159822464, -0.10523463040590286, -0.09639561921358109, -0.08755660057067871, -0.07871758937835693, -0.06987857818603516, -0.06103956699371338, -0.0522005520761013, -0.04336153715848923, -0.03452252596616745, -0.025683514773845673, -0.016844499856233597, -0.008005484938621521, 0.0008335262537002563, 0.009672539308667183, 0.01851155236363411, 0.027350565418601036, 0.03618957847356796, 0.04502858966588974, 0.053867604583501816, 0.06270661950111389, 0.07154563069343567, 0.08038464188575745, 0.08922365307807922, 0.0980626717209816, 0.10690168291330338, 0.11574069410562515, 0.12457971274852753, 0.1334187239408493, 0.14225773513317108, 0.15109674632549286, 0.15993575751781464, 0.1687747687101364, 0.17761379480361938, 0.18645280599594116, 0.19529181718826294, 0.20413082838058472, 0.2129698395729065]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 5.0, 8.0, 8.0, 13.0, 15.0, 13.0, 18.0, 27.0, 28.0, 39.0, 41.0, 54.0, 57.0, 52.0, 52.0, 54.0, 68.0, 36.0, 44.0, 48.0, 49.0, 42.0, 42.0, 43.0, 28.0, 20.0, 22.0, 19.0, 12.0, 16.0, 7.0, 5.0, 5.0, 6.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.08969593048095703, -0.08738823235034943, -0.08508054167032242, -0.08277285099029541, -0.0804651528596878, -0.0781574547290802, -0.07584976404905319, -0.07354207336902618, -0.07123437523841858, -0.06892667710781097, -0.06661898642778397, -0.06431129574775696, -0.06200359761714935, -0.059695903211832047, -0.05738820880651474, -0.055080514401197433, -0.05277281999588013, -0.05046512559056282, -0.048157431185245514, -0.04584973677992821, -0.0435420423746109, -0.041234347969293594, -0.03892665356397629, -0.03661895915865898, -0.034311264753341675, -0.03200357034802437, -0.029695875942707062, -0.027388181537389755, -0.02508048713207245, -0.022772792726755142, -0.020465098321437836, -0.01815740391612053, -0.015849709510803223, -0.013542015105485916, -0.01123432070016861, -0.008926626294851303, -0.006618931889533997, -0.00431123748421669, -0.0020035430788993835, 0.000304151326417923, 0.0026118457317352295, 0.004919540137052536, 0.0072272345423698425, 0.009534928947687149, 0.011842623353004456, 0.014150317758321762, 0.01645801216363907, 0.018765706568956375, 0.02107340097427368, 0.023381095379590988, 0.025688789784908295, 0.0279964841902256, 0.030304178595542908, 0.032611873000860214, 0.03491956740617752, 0.03722726181149483, 0.039534956216812134, 0.04184265062212944, 0.04415034502744675, 0.04645803943276405, 0.04876573383808136, 0.051073428243398666, 0.05338112264871597, 0.05568881705403328, 0.057996511459350586]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 10.0, 5.0, 6.0, 9.0, 17.0, 19.0, 28.0, 60.0, 60.0, 84.0, 143.0, 191.0, 315.0, 459.0, 758.0, 1419.0, 3369.0, 10570.0, 51964.0, 366807.0, 509723.0, 79783.0, 14543.0, 4180.0, 1654.0, 861.0, 498.0, 304.0, 228.0, 153.0, 87.0, 75.0, 40.0, 34.0, 28.0, 26.0, 10.0, 11.0, 8.0, 5.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.06146240234375, -0.05971193313598633, -0.057961463928222656, -0.056210994720458984, -0.05446052551269531, -0.05271005630493164, -0.05095958709716797, -0.0492091178894043, -0.047458648681640625, -0.04570817947387695, -0.04395771026611328, -0.04220724105834961, -0.04045677185058594, -0.038706302642822266, -0.036955833435058594, -0.03520536422729492, -0.03345489501953125, -0.03170442581176758, -0.029953956604003906, -0.028203487396240234, -0.026453018188476562, -0.02470254898071289, -0.02295207977294922, -0.021201610565185547, -0.019451141357421875, -0.017700672149658203, -0.01595020294189453, -0.01419973373413086, -0.012449264526367188, -0.010698795318603516, -0.008948326110839844, -0.007197856903076172, -0.0054473876953125, -0.003696918487548828, -0.0019464492797851562, -0.00019598007202148438, 0.0015544891357421875, 0.0033049583435058594, 0.005055427551269531, 0.006805896759033203, 0.008556365966796875, 0.010306835174560547, 0.012057304382324219, 0.01380777359008789, 0.015558242797851562, 0.017308712005615234, 0.019059181213378906, 0.020809650421142578, 0.02256011962890625, 0.024310588836669922, 0.026061058044433594, 0.027811527252197266, 0.029561996459960938, 0.03131246566772461, 0.03306293487548828, 0.03481340408325195, 0.036563873291015625, 0.0383143424987793, 0.04006481170654297, 0.04181528091430664, 0.04356575012207031, 0.045316219329833984, 0.047066688537597656, 0.04881715774536133, 0.050567626953125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 5.0, 13.0, 31.0, 56.0, 98.0, 120.0, 145.0, 133.0, 132.0, 99.0, 69.0, 53.0, 24.0, 12.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0270843505859375, -0.026269912719726562, -0.025455474853515625, -0.024641036987304688, -0.02382659912109375, -0.023012161254882812, -0.022197723388671875, -0.021383285522460938, -0.02056884765625, -0.019754409790039062, -0.018939971923828125, -0.018125534057617188, -0.01731109619140625, -0.016496658325195312, -0.015682220458984375, -0.014867782592773438, -0.0140533447265625, -0.013238906860351562, -0.012424468994140625, -0.011610031127929688, -0.01079559326171875, -0.009981155395507812, -0.009166717529296875, -0.008352279663085938, -0.007537841796875, -0.0067234039306640625, -0.005908966064453125, -0.0050945281982421875, -0.00428009033203125, -0.0034656524658203125, -0.002651214599609375, -0.0018367767333984375, -0.0010223388671875, -0.0002079010009765625, 0.000606536865234375, 0.0014209747314453125, 0.00223541259765625, 0.0030498504638671875, 0.003864288330078125, 0.0046787261962890625, 0.0054931640625, 0.0063076019287109375, 0.007122039794921875, 0.007936477661132812, 0.00875091552734375, 0.009565353393554688, 0.010379791259765625, 0.011194229125976562, 0.0120086669921875, 0.012823104858398438, 0.013637542724609375, 0.014451980590820312, 0.01526641845703125, 0.016080856323242188, 0.016895294189453125, 0.017709732055664062, 0.018524169921875, 0.019338607788085938, 0.020153045654296875, 0.020967483520507812, 0.02178192138671875, 0.022596359252929688, 0.023410797119140625, 0.024225234985351562, 0.0250396728515625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 1.0, 6.0, 10.0, 16.0, 36.0, 25.0, 59.0, 69.0, 156.0, 242.0, 385.0, 711.0, 1270.0, 2469.0, 5126.0, 11225.0, 26599.0, 68009.0, 188620.0, 391175.0, 219380.0, 78299.0, 30159.0, 12790.0, 5767.0, 2656.0, 1453.0, 806.0, 404.0, 228.0, 142.0, 88.0, 61.0, 39.0, 26.0, 17.0, 8.0, 10.0, 7.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.03533935546875, -0.03437304496765137, -0.033406734466552734, -0.0324404239654541, -0.03147411346435547, -0.030507802963256836, -0.029541492462158203, -0.02857518196105957, -0.027608871459960938, -0.026642560958862305, -0.025676250457763672, -0.02470993995666504, -0.023743629455566406, -0.022777318954467773, -0.02181100845336914, -0.020844697952270508, -0.019878387451171875, -0.018912076950073242, -0.01794576644897461, -0.016979455947875977, -0.016013145446777344, -0.015046834945678711, -0.014080524444580078, -0.013114213943481445, -0.012147903442382812, -0.01118159294128418, -0.010215282440185547, -0.009248971939086914, -0.008282661437988281, -0.0073163509368896484, -0.006350040435791016, -0.005383729934692383, -0.00441741943359375, -0.003451108932495117, -0.0024847984313964844, -0.0015184879302978516, -0.0005521774291992188, 0.00041413307189941406, 0.0013804435729980469, 0.0023467540740966797, 0.0033130645751953125, 0.004279375076293945, 0.005245685577392578, 0.006211996078491211, 0.007178306579589844, 0.008144617080688477, 0.00911092758178711, 0.010077238082885742, 0.011043548583984375, 0.012009859085083008, 0.01297616958618164, 0.013942480087280273, 0.014908790588378906, 0.01587510108947754, 0.016841411590576172, 0.017807722091674805, 0.018774032592773438, 0.01974034309387207, 0.020706653594970703, 0.021672964096069336, 0.02263927459716797, 0.0236055850982666, 0.024571895599365234, 0.025538206100463867, 0.0265045166015625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 2.0, 6.0, 6.0, 8.0, 8.0, 15.0, 12.0, 19.0, 19.0, 24.0, 35.0, 33.0, 27.0, 53.0, 45.0, 57.0, 61.0, 65.0, 48.0, 43.0, 57.0, 54.0, 46.0, 50.0, 37.0, 28.0, 25.0, 31.0, 20.0, 17.0, 13.0, 8.0, 10.0, 6.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.04669189453125, -0.045441627502441406, -0.04419136047363281, -0.04294109344482422, -0.041690826416015625, -0.04044055938720703, -0.03919029235839844, -0.037940025329589844, -0.03668975830078125, -0.035439491271972656, -0.03418922424316406, -0.03293895721435547, -0.031688690185546875, -0.03043842315673828, -0.029188156127929688, -0.027937889099121094, -0.0266876220703125, -0.025437355041503906, -0.024187088012695312, -0.02293682098388672, -0.021686553955078125, -0.02043628692626953, -0.019186019897460938, -0.017935752868652344, -0.01668548583984375, -0.015435218811035156, -0.014184951782226562, -0.012934684753417969, -0.011684417724609375, -0.010434150695800781, -0.009183883666992188, -0.007933616638183594, -0.006683349609375, -0.005433082580566406, -0.0041828155517578125, -0.0029325485229492188, -0.001682281494140625, -0.00043201446533203125, 0.0008182525634765625, 0.0020685195922851562, 0.00331878662109375, 0.004569053649902344, 0.0058193206787109375, 0.007069587707519531, 0.008319854736328125, 0.009570121765136719, 0.010820388793945312, 0.012070655822753906, 0.0133209228515625, 0.014571189880371094, 0.015821456909179688, 0.01707172393798828, 0.018321990966796875, 0.01957225799560547, 0.020822525024414062, 0.022072792053222656, 0.02332305908203125, 0.024573326110839844, 0.025823593139648438, 0.02707386016845703, 0.028324127197265625, 0.02957439422607422, 0.030824661254882812, 0.032074928283691406, 0.0333251953125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 3.0, 5.0, 3.0, 5.0, 13.0, 10.0, 17.0, 28.0, 40.0, 49.0, 75.0, 92.0, 123.0, 187.0, 252.0, 315.0, 469.0, 654.0, 1039.0, 1602.0, 2650.0, 5588.0, 14508.0, 50214.0, 295682.0, 553092.0, 84140.0, 21041.0, 7535.0, 3470.0, 1841.0, 1147.0, 782.0, 545.0, 373.0, 274.0, 195.0, 147.0, 109.0, 66.0, 60.0, 40.0, 17.0, 23.0, 10.0, 13.0, 6.0, 9.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0231170654296875, -0.022296428680419922, -0.021475791931152344, -0.020655155181884766, -0.019834518432617188, -0.01901388168334961, -0.01819324493408203, -0.017372608184814453, -0.016551971435546875, -0.015731334686279297, -0.014910697937011719, -0.01409006118774414, -0.013269424438476562, -0.012448787689208984, -0.011628150939941406, -0.010807514190673828, -0.00998687744140625, -0.009166240692138672, -0.008345603942871094, -0.007524967193603516, -0.0067043304443359375, -0.005883693695068359, -0.005063056945800781, -0.004242420196533203, -0.003421783447265625, -0.002601146697998047, -0.0017805099487304688, -0.0009598731994628906, -0.0001392364501953125, 0.0006814002990722656, 0.0015020370483398438, 0.002322673797607422, 0.003143310546875, 0.003963947296142578, 0.004784584045410156, 0.005605220794677734, 0.0064258575439453125, 0.007246494293212891, 0.008067131042480469, 0.008887767791748047, 0.009708404541015625, 0.010529041290283203, 0.011349678039550781, 0.01217031478881836, 0.012990951538085938, 0.013811588287353516, 0.014632225036621094, 0.015452861785888672, 0.01627349853515625, 0.017094135284423828, 0.017914772033691406, 0.018735408782958984, 0.019556045532226562, 0.02037668228149414, 0.02119731903076172, 0.022017955780029297, 0.022838592529296875, 0.023659229278564453, 0.02447986602783203, 0.02530050277709961, 0.026121139526367188, 0.026941776275634766, 0.027762413024902344, 0.028583049774169922, 0.0294036865234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 1.0, 3.0, 3.0, 8.0, 6.0, 7.0, 10.0, 8.0, 15.0, 20.0, 20.0, 31.0, 26.0, 32.0, 49.0, 66.0, 68.0, 78.0, 90.0, 100.0, 71.0, 53.0, 50.0, 44.0, 31.0, 13.0, 23.0, 19.0, 16.0, 8.0, 6.0, 5.0, 1.0, 6.0, 6.0, 3.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.710124969482422e-05, -5.514174699783325e-05, -5.3182244300842285e-05, -5.122274160385132e-05, -4.926323890686035e-05, -4.7303736209869385e-05, -4.534423351287842e-05, -4.338473081588745e-05, -4.1425228118896484e-05, -3.946572542190552e-05, -3.750622272491455e-05, -3.5546720027923584e-05, -3.358721733093262e-05, -3.162771463394165e-05, -2.9668211936950684e-05, -2.7708709239959717e-05, -2.574920654296875e-05, -2.3789703845977783e-05, -2.1830201148986816e-05, -1.987069845199585e-05, -1.7911195755004883e-05, -1.5951693058013916e-05, -1.399219036102295e-05, -1.2032687664031982e-05, -1.0073184967041016e-05, -8.113682270050049e-06, -6.154179573059082e-06, -4.194676876068115e-06, -2.2351741790771484e-06, -2.7567148208618164e-07, 1.6838312149047852e-06, 3.643333911895752e-06, 5.602836608886719e-06, 7.5623393058776855e-06, 9.521842002868652e-06, 1.1481344699859619e-05, 1.3440847396850586e-05, 1.5400350093841553e-05, 1.735985279083252e-05, 1.9319355487823486e-05, 2.1278858184814453e-05, 2.323836088180542e-05, 2.5197863578796387e-05, 2.7157366275787354e-05, 2.911686897277832e-05, 3.107637166976929e-05, 3.3035874366760254e-05, 3.499537706375122e-05, 3.695487976074219e-05, 3.8914382457733154e-05, 4.087388515472412e-05, 4.283338785171509e-05, 4.4792890548706055e-05, 4.675239324569702e-05, 4.871189594268799e-05, 5.0671398639678955e-05, 5.263090133666992e-05, 5.459040403366089e-05, 5.6549906730651855e-05, 5.850940942764282e-05, 6.046891212463379e-05, 6.242841482162476e-05, 6.438791751861572e-05, 6.634742021560669e-05, 6.830692291259766e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 6.0, 2.0, 8.0, 7.0, 14.0, 8.0, 30.0, 28.0, 51.0, 60.0, 134.0, 161.0, 297.0, 434.0, 896.0, 1630.0, 3514.0, 8265.0, 25757.0, 102341.0, 533220.0, 288703.0, 56140.0, 15749.0, 5603.0, 2590.0, 1230.0, 650.0, 363.0, 217.0, 141.0, 107.0, 75.0, 45.0, 25.0, 16.0, 15.0, 7.0, 10.0, 7.0, 0.0, 8.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02154541015625, -0.02086782455444336, -0.02019023895263672, -0.019512653350830078, -0.018835067749023438, -0.018157482147216797, -0.017479896545410156, -0.016802310943603516, -0.016124725341796875, -0.015447139739990234, -0.014769554138183594, -0.014091968536376953, -0.013414382934570312, -0.012736797332763672, -0.012059211730957031, -0.01138162612915039, -0.01070404052734375, -0.01002645492553711, -0.009348869323730469, -0.008671283721923828, -0.007993698120117188, -0.007316112518310547, -0.006638526916503906, -0.005960941314697266, -0.005283355712890625, -0.004605770111083984, -0.003928184509277344, -0.003250598907470703, -0.0025730133056640625, -0.0018954277038574219, -0.0012178421020507812, -0.0005402565002441406, 0.0001373291015625, 0.0008149147033691406, 0.0014925003051757812, 0.002170085906982422, 0.0028476715087890625, 0.003525257110595703, 0.004202842712402344, 0.004880428314208984, 0.005558013916015625, 0.006235599517822266, 0.006913185119628906, 0.007590770721435547, 0.008268356323242188, 0.008945941925048828, 0.009623527526855469, 0.01030111312866211, 0.01097869873046875, 0.01165628433227539, 0.012333869934082031, 0.013011455535888672, 0.013689041137695312, 0.014366626739501953, 0.015044212341308594, 0.015721797943115234, 0.016399383544921875, 0.017076969146728516, 0.017754554748535156, 0.018432140350341797, 0.019109725952148438, 0.019787311553955078, 0.02046489715576172, 0.02114248275756836, 0.021820068359375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 18.0, 11.0, 31.0, 32.0, 54.0, 83.0, 178.0, 185.0, 150.0, 92.0, 44.0, 29.0, 16.0, 16.0, 16.0, 6.0, 10.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.022369384765625, -0.02149057388305664, -0.02061176300048828, -0.019732952117919922, -0.018854141235351562, -0.017975330352783203, -0.017096519470214844, -0.016217708587646484, -0.015338897705078125, -0.014460086822509766, -0.013581275939941406, -0.012702465057373047, -0.011823654174804688, -0.010944843292236328, -0.010066032409667969, -0.00918722152709961, -0.00830841064453125, -0.007429599761962891, -0.006550788879394531, -0.005671977996826172, -0.0047931671142578125, -0.003914356231689453, -0.0030355453491210938, -0.0021567344665527344, -0.001277923583984375, -0.0003991127014160156, 0.00047969818115234375, 0.0013585090637207031, 0.0022373199462890625, 0.003116130828857422, 0.003994941711425781, 0.004873752593994141, 0.0057525634765625, 0.006631374359130859, 0.007510185241699219, 0.008388996124267578, 0.009267807006835938, 0.010146617889404297, 0.011025428771972656, 0.011904239654541016, 0.012783050537109375, 0.013661861419677734, 0.014540672302246094, 0.015419483184814453, 0.016298294067382812, 0.017177104949951172, 0.01805591583251953, 0.01893472671508789, 0.01981353759765625, 0.02069234848022461, 0.02157115936279297, 0.022449970245361328, 0.023328781127929688, 0.024207592010498047, 0.025086402893066406, 0.025965213775634766, 0.026844024658203125, 0.027722835540771484, 0.028601646423339844, 0.029480457305908203, 0.030359268188476562, 0.031238079071044922, 0.03211688995361328, 0.03299570083618164, 0.03387451171875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 4.0, 7.0, 17.0, 23.0, 29.0, 70.0, 87.0, 136.0, 124.0, 103.0, 113.0, 78.0, 67.0, 39.0, 26.0, 15.0, 11.0, 11.0, 7.0, 7.0, 6.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.20814645290374756, -0.20171432197093964, -0.19528217613697052, -0.1888500452041626, -0.18241789937019348, -0.17598576843738556, -0.16955362260341644, -0.16312149167060852, -0.1566893458366394, -0.15025721490383148, -0.14382506906986237, -0.13739293813705444, -0.13096079230308533, -0.1245286613702774, -0.11809651553630829, -0.11166438460350037, -0.10523224622011185, -0.09880010783672333, -0.09236796945333481, -0.08593583106994629, -0.07950369268655777, -0.07307155430316925, -0.06663942337036133, -0.06020728126168251, -0.05377514287829399, -0.04734300449490547, -0.04091086611151695, -0.03447873145341873, -0.028046591207385063, -0.021614454686641693, -0.015182316303253174, -0.008750177919864655, -0.0023180395364761353, 0.004114098381251097, 0.010546236298978329, 0.016978373751044273, 0.023410512134432793, 0.029842648655176163, 0.03627478703856468, 0.0427069254219532, 0.04913906380534172, 0.05557120218873024, 0.06200334057211876, 0.06843547523021698, 0.0748676136136055, 0.08129975199699402, 0.08773189038038254, 0.09416402876377106, 0.10059616714715958, 0.1070283055305481, 0.11346044391393661, 0.11989258229732513, 0.12632471323013306, 0.13275685906410217, 0.1391889899969101, 0.1456211358308792, 0.15205326676368713, 0.15848539769649506, 0.16491754353046417, 0.1713496744632721, 0.1777818202972412, 0.18421395123004913, 0.19064609706401825, 0.19707822799682617, 0.2035103738307953]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 3.0, 6.0, 7.0, 7.0, 14.0, 17.0, 6.0, 12.0, 20.0, 15.0, 16.0, 17.0, 22.0, 27.0, 29.0, 31.0, 37.0, 29.0, 32.0, 27.0, 26.0, 28.0, 41.0, 52.0, 36.0, 33.0, 44.0, 41.0, 36.0, 30.0, 31.0, 26.0, 37.0, 23.0, 16.0, 18.0, 14.0, 13.0, 19.0, 10.0, 13.0, 12.0, 4.0, 10.0, 8.0, 3.0, 0.0, 4.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0795784592628479, -0.07692801207304001, -0.07427756488323212, -0.07162711769342422, -0.06897667050361633, -0.06632623076438904, -0.06367578357458115, -0.061025336384773254, -0.05837488919496536, -0.05572444200515747, -0.05307399481534958, -0.050423551350831985, -0.047773104161024094, -0.0451226569712162, -0.04247221350669861, -0.03982176631689072, -0.037171319127082825, -0.03452087193727493, -0.03187042474746704, -0.029219981282949448, -0.026569534093141556, -0.023919086903333664, -0.02126864157617092, -0.01861819624900818, -0.015967749059200287, -0.01331730280071497, -0.010666856542229652, -0.008016410283744335, -0.005365964025259018, -0.0027155177667737007, -6.507150828838348e-05, 0.002585373818874359, 0.005235821008682251, 0.007886267267167568, 0.010536713525652885, 0.013187159784138203, 0.01583760604262352, 0.018488053232431412, 0.021138498559594154, 0.023788943886756897, 0.02643939107656479, 0.02908983826637268, 0.03174028545618057, 0.034390728920698166, 0.03704117611050606, 0.03969162330031395, 0.04234206676483154, 0.044992513954639435, 0.04764296114444733, 0.05029340833425522, 0.05294385552406311, 0.055594298988580704, 0.058244746178388596, 0.06089519336819649, 0.06354563683271408, 0.06619608402252197, 0.06884653121232986, 0.07149697840213776, 0.07414742559194565, 0.07679787278175354, 0.07944831252098083, 0.08209875971078873, 0.08474920690059662, 0.08739965409040451, 0.0900501012802124]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 6.0, 18.0, 23.0, 46.0, 143.0, 449.0, 2142.0, 19848.0, 1727072.0, 2417803.0, 23559.0, 2468.0, 466.0, 142.0, 50.0, 30.0, 8.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0667724609375, -0.06475067138671875, -0.0627288818359375, -0.06070709228515625, -0.058685302734375, -0.05666351318359375, -0.0546417236328125, -0.05261993408203125, -0.05059814453125, -0.04857635498046875, -0.0465545654296875, -0.04453277587890625, -0.042510986328125, -0.04048919677734375, -0.0384674072265625, -0.03644561767578125, -0.034423828125, -0.03240203857421875, -0.0303802490234375, -0.02835845947265625, -0.026336669921875, -0.02431488037109375, -0.0222930908203125, -0.02027130126953125, -0.01824951171875, -0.01622772216796875, -0.0142059326171875, -0.01218414306640625, -0.010162353515625, -0.00814056396484375, -0.0061187744140625, -0.00409698486328125, -0.0020751953125, -5.340576171875e-05, 0.0019683837890625, 0.00399017333984375, 0.006011962890625, 0.00803375244140625, 0.0100555419921875, 0.01207733154296875, 0.01409912109375, 0.01612091064453125, 0.0181427001953125, 0.02016448974609375, 0.022186279296875, 0.02420806884765625, 0.0262298583984375, 0.02825164794921875, 0.0302734375, 0.03229522705078125, 0.0343170166015625, 0.03633880615234375, 0.038360595703125, 0.04038238525390625, 0.0424041748046875, 0.04442596435546875, 0.04644775390625, 0.04846954345703125, 0.0504913330078125, 0.05251312255859375, 0.054534912109375, 0.05655670166015625, 0.0585784912109375, 0.06060028076171875, 0.0626220703125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 7.0, 11.0, 13.0, 31.0, 57.0, 70.0, 110.0, 120.0, 135.0, 123.0, 113.0, 82.0, 64.0, 32.0, 17.0, 13.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.028228759765625, -0.027362823486328125, -0.02649688720703125, -0.025630950927734375, -0.0247650146484375, -0.023899078369140625, -0.02303314208984375, -0.022167205810546875, -0.02130126953125, -0.020435333251953125, -0.01956939697265625, -0.018703460693359375, -0.0178375244140625, -0.016971588134765625, -0.01610565185546875, -0.015239715576171875, -0.014373779296875, -0.013507843017578125, -0.01264190673828125, -0.011775970458984375, -0.0109100341796875, -0.010044097900390625, -0.00917816162109375, -0.008312225341796875, -0.0074462890625, -0.006580352783203125, -0.00571441650390625, -0.004848480224609375, -0.0039825439453125, -0.003116607666015625, -0.00225067138671875, -0.001384735107421875, -0.000518798828125, 0.000347137451171875, 0.00121307373046875, 0.002079010009765625, 0.0029449462890625, 0.003810882568359375, 0.00467681884765625, 0.005542755126953125, 0.00640869140625, 0.007274627685546875, 0.00814056396484375, 0.009006500244140625, 0.0098724365234375, 0.010738372802734375, 0.01160430908203125, 0.012470245361328125, 0.013336181640625, 0.014202117919921875, 0.01506805419921875, 0.015933990478515625, 0.0167999267578125, 0.017665863037109375, 0.01853179931640625, 0.019397735595703125, 0.020263671875, 0.021129608154296875, 0.02199554443359375, 0.022861480712890625, 0.0237274169921875, 0.024593353271484375, 0.02545928955078125, 0.026325225830078125, 0.027191162109375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 7.0, 8.0, 7.0, 16.0, 29.0, 36.0, 43.0, 83.0, 116.0, 199.0, 337.0, 561.0, 990.0, 1851.0, 3918.0, 9570.0, 27620.0, 111859.0, 1695859.0, 2168860.0, 123908.0, 29705.0, 10101.0, 4099.0, 1925.0, 1043.0, 558.0, 357.0, 209.0, 126.0, 85.0, 61.0, 42.0, 33.0, 14.0, 8.0, 8.0, 9.0, 6.0, 2.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0], "bins": [-0.033416748046875, -0.03237342834472656, -0.031330108642578125, -0.030286788940429688, -0.02924346923828125, -0.028200149536132812, -0.027156829833984375, -0.026113510131835938, -0.0250701904296875, -0.024026870727539062, -0.022983551025390625, -0.021940231323242188, -0.02089691162109375, -0.019853591918945312, -0.018810272216796875, -0.017766952514648438, -0.0167236328125, -0.015680313110351562, -0.014636993408203125, -0.013593673706054688, -0.01255035400390625, -0.011507034301757812, -0.010463714599609375, -0.009420394897460938, -0.0083770751953125, -0.0073337554931640625, -0.006290435791015625, -0.0052471160888671875, -0.00420379638671875, -0.0031604766845703125, -0.002117156982421875, -0.0010738372802734375, -3.0517578125e-05, 0.0010128021240234375, 0.002056121826171875, 0.0030994415283203125, 0.00414276123046875, 0.0051860809326171875, 0.006229400634765625, 0.0072727203369140625, 0.0083160400390625, 0.009359359741210938, 0.010402679443359375, 0.011445999145507812, 0.01248931884765625, 0.013532638549804688, 0.014575958251953125, 0.015619277954101562, 0.01666259765625, 0.017705917358398438, 0.018749237060546875, 0.019792556762695312, 0.02083587646484375, 0.021879196166992188, 0.022922515869140625, 0.023965835571289062, 0.0250091552734375, 0.026052474975585938, 0.027095794677734375, 0.028139114379882812, 0.02918243408203125, 0.030225753784179688, 0.031269073486328125, 0.03231239318847656, 0.033355712890625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 8.0, 15.0, 14.0, 22.0, 30.0, 39.0, 56.0, 98.0, 146.0, 220.0, 506.0, 1075.0, 881.0, 389.0, 223.0, 106.0, 56.0, 45.0, 40.0, 18.0, 23.0, 13.0, 9.0, 8.0, 6.0, 4.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0259246826171875, -0.02499556541442871, -0.024066448211669922, -0.023137331008911133, -0.022208213806152344, -0.021279096603393555, -0.020349979400634766, -0.019420862197875977, -0.018491744995117188, -0.0175626277923584, -0.01663351058959961, -0.01570439338684082, -0.014775276184082031, -0.013846158981323242, -0.012917041778564453, -0.011987924575805664, -0.011058807373046875, -0.010129690170288086, -0.009200572967529297, -0.008271455764770508, -0.007342338562011719, -0.00641322135925293, -0.005484104156494141, -0.0045549869537353516, -0.0036258697509765625, -0.0026967525482177734, -0.0017676353454589844, -0.0008385181427001953, 9.059906005859375e-05, 0.0010197162628173828, 0.0019488334655761719, 0.002877950668334961, 0.00380706787109375, 0.004736185073852539, 0.005665302276611328, 0.006594419479370117, 0.007523536682128906, 0.008452653884887695, 0.009381771087646484, 0.010310888290405273, 0.011240005493164062, 0.012169122695922852, 0.01309823989868164, 0.01402735710144043, 0.014956474304199219, 0.015885591506958008, 0.016814708709716797, 0.017743825912475586, 0.018672943115234375, 0.019602060317993164, 0.020531177520751953, 0.021460294723510742, 0.02238941192626953, 0.02331852912902832, 0.02424764633178711, 0.0251767635345459, 0.026105880737304688, 0.027034997940063477, 0.027964115142822266, 0.028893232345581055, 0.029822349548339844, 0.030751466751098633, 0.03168058395385742, 0.03260970115661621, 0.033538818359375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 18.0, 48.0, 142.0, 330.0, 281.0, 100.0, 46.0, 18.0, 6.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43314528465270996, -0.41948965191841125, -0.40583401918411255, -0.39217838644981384, -0.37852275371551514, -0.36486712098121643, -0.3512114882469177, -0.337555855512619, -0.3239002227783203, -0.3102445900440216, -0.2965889573097229, -0.2829333245754242, -0.2692776918411255, -0.2556220591068268, -0.24196642637252808, -0.22831079363822937, -0.21465517580509186, -0.20099954307079315, -0.18734391033649445, -0.17368827760219574, -0.16003264486789703, -0.14637702703475952, -0.13272139430046082, -0.11906575411558151, -0.1054101213812828, -0.0917544886469841, -0.0780988559126854, -0.06444323062896729, -0.05078759416937828, -0.03713196516036987, -0.023476332426071167, -0.009820699691772461, 0.003834933042526245, 0.01749056577682495, 0.031146196648478508, 0.044801827520132065, 0.05845746025443077, 0.07211308926343918, 0.08576872199773788, 0.09942435473203659, 0.1130799874663353, 0.1267356127500534, 0.1403912454843521, 0.15404687821865082, 0.16770251095294952, 0.18135814368724823, 0.19501377642154694, 0.20866940915584564, 0.22232504189014435, 0.23598067462444305, 0.24963630735874176, 0.2632919251918793, 0.276947557926178, 0.2906031906604767, 0.3042588233947754, 0.3179144561290741, 0.3315700888633728, 0.3452257215976715, 0.3588813543319702, 0.3725369870662689, 0.3861926198005676, 0.39984825253486633, 0.41350388526916504, 0.42715951800346375, 0.44081515073776245]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 8.0, 9.0, 12.0, 16.0, 17.0, 19.0, 38.0, 36.0, 33.0, 47.0, 56.0, 61.0, 41.0, 38.0, 58.0, 56.0, 53.0, 64.0, 48.0, 36.0, 41.0, 37.0, 40.0, 26.0, 28.0, 28.0, 17.0, 13.0, 7.0, 8.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11802500486373901, -0.11464447528123856, -0.1112639456987381, -0.10788341611623764, -0.10450288653373718, -0.10112236440181732, -0.09774183481931686, -0.0943613052368164, -0.09098077565431595, -0.08760024607181549, -0.08421971648931503, -0.08083918690681458, -0.07745866477489471, -0.07407812774181366, -0.0706976056098938, -0.06731707602739334, -0.06393654644489288, -0.060556016862392426, -0.05717548727989197, -0.05379496142268181, -0.05041443184018135, -0.04703390225768089, -0.043653376400470734, -0.040272846817970276, -0.03689231723546982, -0.03351178765296936, -0.030131259933114052, -0.026750732213258743, -0.023370202630758286, -0.019989673048257828, -0.01660914532840252, -0.01322861760854721, -0.009848088026046753, -0.00646755937486887, -0.0030870307236909866, 0.0002934979274868965, 0.0036740265786647797, 0.007054556161165237, 0.010435083881020546, 0.013815611600875854, 0.017196141183376312, 0.02057667076587677, 0.02395719848573208, 0.027337726205587387, 0.030718255788087845, 0.0340987853705883, 0.03747931122779846, 0.04085984081029892, 0.04424037039279938, 0.047620899975299835, 0.05100142955780029, 0.05438195541501045, 0.05776248499751091, 0.06114301458001137, 0.06452354043722153, 0.06790407001972198, 0.07128459960222244, 0.0746651291847229, 0.07804565876722336, 0.08142618834972382, 0.08480671048164368, 0.08818724751472473, 0.09156776964664459, 0.09494829922914505, 0.09832882881164551]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 6.0, 14.0, 11.0, 17.0, 19.0, 29.0, 40.0, 54.0, 94.0, 130.0, 176.0, 275.0, 478.0, 868.0, 2044.0, 5358.0, 18223.0, 78592.0, 359351.0, 439352.0, 107723.0, 24082.0, 6744.0, 2405.0, 1008.0, 552.0, 316.0, 171.0, 111.0, 92.0, 56.0, 55.0, 23.0, 26.0, 15.0, 19.0, 6.0, 9.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.06866455078125, -0.0666508674621582, -0.0646371841430664, -0.06262350082397461, -0.06060981750488281, -0.058596134185791016, -0.05658245086669922, -0.05456876754760742, -0.052555084228515625, -0.05054140090942383, -0.04852771759033203, -0.046514034271240234, -0.04450035095214844, -0.04248666763305664, -0.040472984313964844, -0.03845930099487305, -0.03644561767578125, -0.03443193435668945, -0.032418251037597656, -0.03040456771850586, -0.028390884399414062, -0.026377201080322266, -0.02436351776123047, -0.022349834442138672, -0.020336151123046875, -0.018322467803955078, -0.01630878448486328, -0.014295101165771484, -0.012281417846679688, -0.01026773452758789, -0.008254051208496094, -0.006240367889404297, -0.0042266845703125, -0.002213001251220703, -0.00019931793212890625, 0.0018143653869628906, 0.0038280487060546875, 0.005841732025146484, 0.007855415344238281, 0.009869098663330078, 0.011882781982421875, 0.013896465301513672, 0.01591014862060547, 0.017923831939697266, 0.019937515258789062, 0.02195119857788086, 0.023964881896972656, 0.025978565216064453, 0.02799224853515625, 0.030005931854248047, 0.032019615173339844, 0.03403329849243164, 0.03604698181152344, 0.038060665130615234, 0.04007434844970703, 0.04208803176879883, 0.044101715087890625, 0.04611539840698242, 0.04812908172607422, 0.050142765045166016, 0.05215644836425781, 0.05417013168334961, 0.056183815002441406, 0.0581974983215332, 0.060211181640625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 7.0, 14.0, 16.0, 30.0, 42.0, 80.0, 87.0, 111.0, 132.0, 116.0, 91.0, 79.0, 75.0, 43.0, 31.0, 25.0, 17.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0297393798828125, -0.028888225555419922, -0.028037071228027344, -0.027185916900634766, -0.026334762573242188, -0.02548360824584961, -0.02463245391845703, -0.023781299591064453, -0.022930145263671875, -0.022078990936279297, -0.02122783660888672, -0.02037668228149414, -0.019525527954101562, -0.018674373626708984, -0.017823219299316406, -0.016972064971923828, -0.01612091064453125, -0.015269756317138672, -0.014418601989746094, -0.013567447662353516, -0.012716293334960938, -0.01186513900756836, -0.011013984680175781, -0.010162830352783203, -0.009311676025390625, -0.008460521697998047, -0.007609367370605469, -0.006758213043212891, -0.0059070587158203125, -0.005055904388427734, -0.004204750061035156, -0.003353595733642578, -0.00250244140625, -0.0016512870788574219, -0.0008001327514648438, 5.1021575927734375e-05, 0.0009021759033203125, 0.0017533302307128906, 0.0026044845581054688, 0.003455638885498047, 0.004306793212890625, 0.005157947540283203, 0.006009101867675781, 0.006860256195068359, 0.0077114105224609375, 0.008562564849853516, 0.009413719177246094, 0.010264873504638672, 0.01111602783203125, 0.011967182159423828, 0.012818336486816406, 0.013669490814208984, 0.014520645141601562, 0.01537179946899414, 0.01622295379638672, 0.017074108123779297, 0.017925262451171875, 0.018776416778564453, 0.01962757110595703, 0.02047872543334961, 0.021329879760742188, 0.022181034088134766, 0.023032188415527344, 0.023883342742919922, 0.0247344970703125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 8.0, 17.0, 16.0, 37.0, 59.0, 113.0, 191.0, 422.0, 852.0, 2223.0, 5994.0, 19420.0, 70924.0, 276770.0, 464305.0, 150406.0, 39130.0, 11174.0, 3801.0, 1454.0, 589.0, 305.0, 143.0, 71.0, 47.0, 33.0, 14.0, 12.0, 6.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059234619140625, -0.05734062194824219, -0.055446624755859375, -0.05355262756347656, -0.05165863037109375, -0.04976463317871094, -0.047870635986328125, -0.04597663879394531, -0.0440826416015625, -0.04218864440917969, -0.040294647216796875, -0.03840065002441406, -0.03650665283203125, -0.03461265563964844, -0.032718658447265625, -0.030824661254882812, -0.0289306640625, -0.027036666870117188, -0.025142669677734375, -0.023248672485351562, -0.02135467529296875, -0.019460678100585938, -0.017566680908203125, -0.015672683715820312, -0.0137786865234375, -0.011884689331054688, -0.009990692138671875, -0.008096694946289062, -0.00620269775390625, -0.0043087005615234375, -0.002414703369140625, -0.0005207061767578125, 0.001373291015625, 0.0032672882080078125, 0.005161285400390625, 0.0070552825927734375, 0.00894927978515625, 0.010843276977539062, 0.012737274169921875, 0.014631271362304688, 0.0165252685546875, 0.018419265747070312, 0.020313262939453125, 0.022207260131835938, 0.02410125732421875, 0.025995254516601562, 0.027889251708984375, 0.029783248901367188, 0.03167724609375, 0.03357124328613281, 0.035465240478515625, 0.03735923767089844, 0.03925323486328125, 0.04114723205566406, 0.043041229248046875, 0.04493522644042969, 0.0468292236328125, 0.04872322082519531, 0.050617218017578125, 0.05251121520996094, 0.05440521240234375, 0.05629920959472656, 0.058193206787109375, 0.06008720397949219, 0.061981201171875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 10.0, 9.0, 10.0, 14.0, 14.0, 13.0, 12.0, 25.0, 27.0, 46.0, 42.0, 58.0, 47.0, 47.0, 56.0, 47.0, 48.0, 57.0, 51.0, 55.0, 41.0, 36.0, 56.0, 32.0, 29.0, 13.0, 11.0, 14.0, 15.0, 15.0, 9.0, 11.0, 8.0, 3.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.04876708984375, -0.04725074768066406, -0.045734405517578125, -0.04421806335449219, -0.04270172119140625, -0.04118537902832031, -0.039669036865234375, -0.03815269470214844, -0.0366363525390625, -0.03512001037597656, -0.033603668212890625, -0.03208732604980469, -0.03057098388671875, -0.029054641723632812, -0.027538299560546875, -0.026021957397460938, -0.024505615234375, -0.022989273071289062, -0.021472930908203125, -0.019956588745117188, -0.01844024658203125, -0.016923904418945312, -0.015407562255859375, -0.013891220092773438, -0.0123748779296875, -0.010858535766601562, -0.009342193603515625, -0.007825851440429688, -0.00630950927734375, -0.0047931671142578125, -0.003276824951171875, -0.0017604827880859375, -0.000244140625, 0.0012722015380859375, 0.002788543701171875, 0.0043048858642578125, 0.00582122802734375, 0.0073375701904296875, 0.008853912353515625, 0.010370254516601562, 0.0118865966796875, 0.013402938842773438, 0.014919281005859375, 0.016435623168945312, 0.01795196533203125, 0.019468307495117188, 0.020984649658203125, 0.022500991821289062, 0.024017333984375, 0.025533676147460938, 0.027050018310546875, 0.028566360473632812, 0.03008270263671875, 0.03159904479980469, 0.033115386962890625, 0.03463172912597656, 0.0361480712890625, 0.03766441345214844, 0.039180755615234375, 0.04069709777832031, 0.04221343994140625, 0.04372978210449219, 0.045246124267578125, 0.04676246643066406, 0.04827880859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 9.0, 2.0, 9.0, 3.0, 17.0, 18.0, 19.0, 29.0, 52.0, 75.0, 147.0, 198.0, 357.0, 621.0, 980.0, 1716.0, 3132.0, 5579.0, 10417.0, 20778.0, 44232.0, 109161.0, 307042.0, 331008.0, 118925.0, 47485.0, 21831.0, 11066.0, 5892.0, 3199.0, 1793.0, 1045.0, 636.0, 424.0, 259.0, 138.0, 87.0, 59.0, 39.0, 26.0, 13.0, 11.0, 8.0, 10.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.02197265625, -0.021363019943237305, -0.02075338363647461, -0.020143747329711914, -0.01953411102294922, -0.018924474716186523, -0.018314838409423828, -0.017705202102661133, -0.017095565795898438, -0.016485929489135742, -0.015876293182373047, -0.015266656875610352, -0.014657020568847656, -0.014047384262084961, -0.013437747955322266, -0.01282811164855957, -0.012218475341796875, -0.01160883903503418, -0.010999202728271484, -0.010389566421508789, -0.009779930114746094, -0.009170293807983398, -0.008560657501220703, -0.007951021194458008, -0.0073413848876953125, -0.006731748580932617, -0.006122112274169922, -0.0055124759674072266, -0.004902839660644531, -0.004293203353881836, -0.0036835670471191406, -0.0030739307403564453, -0.00246429443359375, -0.0018546581268310547, -0.0012450218200683594, -0.0006353855133056641, -2.574920654296875e-05, 0.0005838871002197266, 0.0011935234069824219, 0.0018031597137451172, 0.0024127960205078125, 0.003022432327270508, 0.003632068634033203, 0.0042417049407958984, 0.004851341247558594, 0.005460977554321289, 0.006070613861083984, 0.00668025016784668, 0.007289886474609375, 0.00789952278137207, 0.008509159088134766, 0.009118795394897461, 0.009728431701660156, 0.010338068008422852, 0.010947704315185547, 0.011557340621948242, 0.012166976928710938, 0.012776613235473633, 0.013386249542236328, 0.013995885848999023, 0.014605522155761719, 0.015215158462524414, 0.01582479476928711, 0.016434431076049805, 0.0170440673828125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 7.0, 10.0, 8.0, 20.0, 15.0, 20.0, 29.0, 33.0, 25.0, 52.0, 50.0, 68.0, 90.0, 69.0, 77.0, 72.0, 57.0, 54.0, 56.0, 42.0, 21.0, 33.0, 16.0, 23.0, 15.0, 15.0, 7.0, 7.0, 8.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.716085433959961e-05, -5.5344775319099426e-05, -5.352869629859924e-05, -5.171261727809906e-05, -4.989653825759888e-05, -4.8080459237098694e-05, -4.626438021659851e-05, -4.444830119609833e-05, -4.2632222175598145e-05, -4.081614315509796e-05, -3.900006413459778e-05, -3.7183985114097595e-05, -3.536790609359741e-05, -3.355182707309723e-05, -3.1735748052597046e-05, -2.9919669032096863e-05, -2.810359001159668e-05, -2.6287510991096497e-05, -2.4471431970596313e-05, -2.265535295009613e-05, -2.0839273929595947e-05, -1.9023194909095764e-05, -1.720711588859558e-05, -1.5391036868095398e-05, -1.3574957847595215e-05, -1.1758878827095032e-05, -9.942799806594849e-06, -8.126720786094666e-06, -6.310641765594482e-06, -4.494562745094299e-06, -2.678483724594116e-06, -8.624047040939331e-07, 9.5367431640625e-07, 2.769753336906433e-06, 4.585832357406616e-06, 6.401911377906799e-06, 8.217990398406982e-06, 1.0034069418907166e-05, 1.1850148439407349e-05, 1.3666227459907532e-05, 1.5482306480407715e-05, 1.7298385500907898e-05, 1.911446452140808e-05, 2.0930543541908264e-05, 2.2746622562408447e-05, 2.456270158290863e-05, 2.6378780603408813e-05, 2.8194859623908997e-05, 3.001093864440918e-05, 3.182701766490936e-05, 3.3643096685409546e-05, 3.545917570590973e-05, 3.727525472640991e-05, 3.9091333746910095e-05, 4.090741276741028e-05, 4.272349178791046e-05, 4.4539570808410645e-05, 4.635564982891083e-05, 4.817172884941101e-05, 4.9987807869911194e-05, 5.180388689041138e-05, 5.361996591091156e-05, 5.543604493141174e-05, 5.7252123951911926e-05, 5.906820297241211e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 3.0, 7.0, 14.0, 10.0, 25.0, 28.0, 35.0, 95.0, 181.0, 285.0, 611.0, 1250.0, 2870.0, 6960.0, 17448.0, 49284.0, 189296.0, 524992.0, 178867.0, 47147.0, 16904.0, 6743.0, 2945.0, 1267.0, 616.0, 292.0, 167.0, 81.0, 42.0, 43.0, 15.0, 11.0, 5.0, 4.0, 7.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02667236328125, -0.025797367095947266, -0.02492237091064453, -0.024047374725341797, -0.023172378540039062, -0.022297382354736328, -0.021422386169433594, -0.02054738998413086, -0.019672393798828125, -0.01879739761352539, -0.017922401428222656, -0.017047405242919922, -0.016172409057617188, -0.015297412872314453, -0.014422416687011719, -0.013547420501708984, -0.01267242431640625, -0.011797428131103516, -0.010922431945800781, -0.010047435760498047, -0.009172439575195312, -0.008297443389892578, -0.007422447204589844, -0.006547451019287109, -0.005672454833984375, -0.004797458648681641, -0.003922462463378906, -0.003047466278076172, -0.0021724700927734375, -0.0012974739074707031, -0.00042247772216796875, 0.0004525184631347656, 0.0013275146484375, 0.0022025108337402344, 0.0030775070190429688, 0.003952503204345703, 0.0048274993896484375, 0.005702495574951172, 0.006577491760253906, 0.007452487945556641, 0.008327484130859375, 0.00920248031616211, 0.010077476501464844, 0.010952472686767578, 0.011827468872070312, 0.012702465057373047, 0.013577461242675781, 0.014452457427978516, 0.01532745361328125, 0.016202449798583984, 0.01707744598388672, 0.017952442169189453, 0.018827438354492188, 0.019702434539794922, 0.020577430725097656, 0.02145242691040039, 0.022327423095703125, 0.02320241928100586, 0.024077415466308594, 0.024952411651611328, 0.025827407836914062, 0.026702404022216797, 0.02757740020751953, 0.028452396392822266, 0.029327392578125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 6.0, 2.0, 4.0, 2.0, 9.0, 5.0, 12.0, 11.0, 15.0, 14.0, 22.0, 23.0, 32.0, 38.0, 50.0, 69.0, 88.0, 134.0, 102.0, 85.0, 71.0, 62.0, 36.0, 20.0, 33.0, 10.0, 11.0, 12.0, 4.0, 10.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.025238037109375, -0.024384021759033203, -0.023530006408691406, -0.02267599105834961, -0.021821975708007812, -0.020967960357666016, -0.02011394500732422, -0.019259929656982422, -0.018405914306640625, -0.017551898956298828, -0.01669788360595703, -0.015843868255615234, -0.014989852905273438, -0.01413583755493164, -0.013281822204589844, -0.012427806854248047, -0.01157379150390625, -0.010719776153564453, -0.009865760803222656, -0.00901174545288086, -0.008157730102539062, -0.007303714752197266, -0.006449699401855469, -0.005595684051513672, -0.004741668701171875, -0.003887653350830078, -0.0030336380004882812, -0.0021796226501464844, -0.0013256072998046875, -0.0004715919494628906, 0.00038242340087890625, 0.0012364387512207031, 0.0020904541015625, 0.002944469451904297, 0.0037984848022460938, 0.004652500152587891, 0.0055065155029296875, 0.006360530853271484, 0.007214546203613281, 0.008068561553955078, 0.008922576904296875, 0.009776592254638672, 0.010630607604980469, 0.011484622955322266, 0.012338638305664062, 0.01319265365600586, 0.014046669006347656, 0.014900684356689453, 0.01575469970703125, 0.016608715057373047, 0.017462730407714844, 0.01831674575805664, 0.019170761108398438, 0.020024776458740234, 0.02087879180908203, 0.021732807159423828, 0.022586822509765625, 0.023440837860107422, 0.02429485321044922, 0.025148868560791016, 0.026002883911132812, 0.02685689926147461, 0.027710914611816406, 0.028564929962158203, 0.0294189453125]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 5.0, 7.0, 14.0, 12.0, 24.0, 40.0, 55.0, 72.0, 74.0, 90.0, 110.0, 86.0, 101.0, 82.0, 66.0, 48.0, 30.0, 22.0, 20.0, 15.0, 5.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2896897792816162, -0.28223860263824463, -0.27478742599487305, -0.2673362195491791, -0.2598850429058075, -0.2524338662624359, -0.24498268961906433, -0.23753151297569275, -0.23008032143115997, -0.2226291447877884, -0.21517795324325562, -0.20772677659988403, -0.20027559995651245, -0.19282440841197968, -0.1853732317686081, -0.17792204022407532, -0.17047086358070374, -0.16301968693733215, -0.15556849539279938, -0.1481173187494278, -0.14066612720489502, -0.13321495056152344, -0.12576377391815186, -0.11831258982419968, -0.1108614057302475, -0.10341022163629532, -0.09595903754234314, -0.08850786089897156, -0.08105667680501938, -0.0736054927110672, -0.06615431606769562, -0.05870313197374344, -0.051251962780952454, -0.043800778687000275, -0.036349598318338394, -0.028898416087031364, -0.021447233855724335, -0.013996049761772156, -0.006544869393110275, 0.0009063109755516052, 0.008357495069503784, 0.015808677300810814, 0.023259859532117844, 0.030711041763424873, 0.0381622239947319, 0.04561340808868408, 0.05306458845734596, 0.06051576882600784, 0.06796695291996002, 0.0754181370139122, 0.08286932110786438, 0.09032049775123596, 0.09777168184518814, 0.10522286593914032, 0.1126740425825119, 0.12012522667646408, 0.12757641077041626, 0.13502758741378784, 0.14247877895832062, 0.1499299556016922, 0.15738114714622498, 0.16483232378959656, 0.17228350043296814, 0.17973467707633972, 0.1871858686208725]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 2.0, 4.0, 2.0, 2.0, 7.0, 2.0, 14.0, 13.0, 19.0, 8.0, 21.0, 25.0, 23.0, 21.0, 23.0, 24.0, 40.0, 30.0, 27.0, 43.0, 45.0, 57.0, 53.0, 51.0, 44.0, 34.0, 51.0, 49.0, 34.0, 46.0, 28.0, 24.0, 19.0, 24.0, 16.0, 12.0, 12.0, 13.0, 14.0, 6.0, 9.0, 9.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12698519229888916, -0.1231943741440773, -0.11940354853868484, -0.11561273038387299, -0.11182190477848053, -0.10803108662366867, -0.10424026846885681, -0.10044944286346436, -0.0966586247086525, -0.09286780655384064, -0.08907698094844818, -0.08528616279363632, -0.08149534463882446, -0.077704519033432, -0.07391370087862015, -0.07012288272380829, -0.06633205711841583, -0.06254123896360397, -0.05875041335821152, -0.05495959520339966, -0.0511687733232975, -0.04737795144319534, -0.043587133288383484, -0.039796311408281326, -0.03600548952817917, -0.03221466764807701, -0.028423847630620003, -0.024633027613162994, -0.020842205733060837, -0.01705138385295868, -0.01326056383550167, -0.009469743818044662, -0.005678921937942505, -0.001888100989162922, 0.001902719959616661, 0.005693540908396244, 0.009484361857175827, 0.013275183737277985, 0.017066003754734993, 0.020856823772192, 0.02464764565229416, 0.028438467532396317, 0.032229289412498474, 0.03602010756731033, 0.03981092944741249, 0.04360175132751465, 0.04739256948232651, 0.051183391362428665, 0.05497421324253082, 0.05876503512263298, 0.06255585700273514, 0.066346675157547, 0.07013750076293945, 0.07392831891775131, 0.07771913707256317, 0.08150996267795563, 0.08530078083276749, 0.08909159898757935, 0.0928824245929718, 0.09667324274778366, 0.10046406090259552, 0.10425488650798798, 0.10804570466279984, 0.1118365228176117, 0.11562734842300415]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 11.0, 10.0, 22.0, 31.0, 56.0, 124.0, 292.0, 701.0, 2261.0, 7585.0, 31930.0, 279712.0, 3441317.0, 378832.0, 38905.0, 8709.0, 2338.0, 831.0, 307.0, 145.0, 68.0, 35.0, 19.0, 14.0, 5.0, 4.0, 10.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037445068359375, -0.036034584045410156, -0.03462409973144531, -0.03321361541748047, -0.031803131103515625, -0.03039264678955078, -0.028982162475585938, -0.027571678161621094, -0.02616119384765625, -0.024750709533691406, -0.023340225219726562, -0.02192974090576172, -0.020519256591796875, -0.01910877227783203, -0.017698287963867188, -0.016287803649902344, -0.0148773193359375, -0.013466835021972656, -0.012056350708007812, -0.010645866394042969, -0.009235382080078125, -0.007824897766113281, -0.0064144134521484375, -0.005003929138183594, -0.00359344482421875, -0.0021829605102539062, -0.0007724761962890625, 0.0006380081176757812, 0.002048492431640625, 0.0034589767456054688, 0.0048694610595703125, 0.006279945373535156, 0.0076904296875, 0.009100914001464844, 0.010511398315429688, 0.011921882629394531, 0.013332366943359375, 0.014742851257324219, 0.016153335571289062, 0.017563819885253906, 0.01897430419921875, 0.020384788513183594, 0.021795272827148438, 0.02320575714111328, 0.024616241455078125, 0.02602672576904297, 0.027437210083007812, 0.028847694396972656, 0.0302581787109375, 0.031668663024902344, 0.03307914733886719, 0.03448963165283203, 0.035900115966796875, 0.03731060028076172, 0.03872108459472656, 0.040131568908691406, 0.04154205322265625, 0.042952537536621094, 0.04436302185058594, 0.04577350616455078, 0.047183990478515625, 0.04859447479248047, 0.05000495910644531, 0.051415443420410156, 0.052825927734375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 12.0, 8.0, 24.0, 29.0, 56.0, 55.0, 76.0, 112.0, 129.0, 119.0, 90.0, 95.0, 71.0, 39.0, 33.0, 23.0, 19.0, 11.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.029052734375, -0.028144121170043945, -0.02723550796508789, -0.026326894760131836, -0.02541828155517578, -0.024509668350219727, -0.023601055145263672, -0.022692441940307617, -0.021783828735351562, -0.020875215530395508, -0.019966602325439453, -0.0190579891204834, -0.018149375915527344, -0.01724076271057129, -0.016332149505615234, -0.01542353630065918, -0.014514923095703125, -0.01360630989074707, -0.012697696685791016, -0.011789083480834961, -0.010880470275878906, -0.009971857070922852, -0.009063243865966797, -0.008154630661010742, -0.0072460174560546875, -0.006337404251098633, -0.005428791046142578, -0.0045201778411865234, -0.0036115646362304688, -0.002702951431274414, -0.0017943382263183594, -0.0008857250213623047, 2.288818359375e-05, 0.0009315013885498047, 0.0018401145935058594, 0.002748727798461914, 0.0036573410034179688, 0.0045659542083740234, 0.005474567413330078, 0.006383180618286133, 0.0072917938232421875, 0.008200407028198242, 0.009109020233154297, 0.010017633438110352, 0.010926246643066406, 0.011834859848022461, 0.012743473052978516, 0.01365208625793457, 0.014560699462890625, 0.01546931266784668, 0.016377925872802734, 0.01728653907775879, 0.018195152282714844, 0.0191037654876709, 0.020012378692626953, 0.020920991897583008, 0.021829605102539062, 0.022738218307495117, 0.023646831512451172, 0.024555444717407227, 0.02546405792236328, 0.026372671127319336, 0.02728128433227539, 0.028189897537231445, 0.0290985107421875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 6.0, 11.0, 12.0, 27.0, 39.0, 57.0, 71.0, 98.0, 183.0, 341.0, 550.0, 1068.0, 2339.0, 6351.0, 21319.0, 104694.0, 2157398.0, 1772821.0, 96394.0, 19820.0, 5961.0, 2292.0, 1032.0, 548.0, 310.0, 201.0, 121.0, 91.0, 38.0, 44.0, 19.0, 15.0, 7.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05352783203125, -0.05190467834472656, -0.050281524658203125, -0.04865837097167969, -0.04703521728515625, -0.04541206359863281, -0.043788909912109375, -0.04216575622558594, -0.0405426025390625, -0.03891944885253906, -0.037296295166015625, -0.03567314147949219, -0.03404998779296875, -0.03242683410644531, -0.030803680419921875, -0.029180526733398438, -0.027557373046875, -0.025934219360351562, -0.024311065673828125, -0.022687911987304688, -0.02106475830078125, -0.019441604614257812, -0.017818450927734375, -0.016195297241210938, -0.0145721435546875, -0.012948989868164062, -0.011325836181640625, -0.009702682495117188, -0.00807952880859375, -0.0064563751220703125, -0.004833221435546875, -0.0032100677490234375, -0.0015869140625, 3.62396240234375e-05, 0.001659393310546875, 0.0032825469970703125, 0.00490570068359375, 0.0065288543701171875, 0.008152008056640625, 0.009775161743164062, 0.0113983154296875, 0.013021469116210938, 0.014644622802734375, 0.016267776489257812, 0.01789093017578125, 0.019514083862304688, 0.021137237548828125, 0.022760391235351562, 0.024383544921875, 0.026006698608398438, 0.027629852294921875, 0.029253005981445312, 0.03087615966796875, 0.03249931335449219, 0.034122467041015625, 0.03574562072753906, 0.0373687744140625, 0.03899192810058594, 0.040615081787109375, 0.04223823547363281, 0.04386138916015625, 0.04548454284667969, 0.047107696533203125, 0.04873085021972656, 0.05035400390625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 5.0, 2.0, 5.0, 1.0, 8.0, 4.0, 6.0, 6.0, 14.0, 15.0, 19.0, 36.0, 37.0, 58.0, 89.0, 129.0, 202.0, 399.0, 834.0, 887.0, 547.0, 235.0, 179.0, 98.0, 68.0, 53.0, 45.0, 20.0, 21.0, 13.0, 13.0, 11.0, 10.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0252227783203125, -0.024083852767944336, -0.022944927215576172, -0.021806001663208008, -0.020667076110839844, -0.01952815055847168, -0.018389225006103516, -0.01725029945373535, -0.016111373901367188, -0.014972448348999023, -0.01383352279663086, -0.012694597244262695, -0.011555671691894531, -0.010416746139526367, -0.009277820587158203, -0.008138895034790039, -0.006999969482421875, -0.005861043930053711, -0.004722118377685547, -0.003583192825317383, -0.0024442672729492188, -0.0013053417205810547, -0.00016641616821289062, 0.0009725093841552734, 0.0021114349365234375, 0.0032503604888916016, 0.004389286041259766, 0.00552821159362793, 0.006667137145996094, 0.007806062698364258, 0.008944988250732422, 0.010083913803100586, 0.01122283935546875, 0.012361764907836914, 0.013500690460205078, 0.014639616012573242, 0.015778541564941406, 0.01691746711730957, 0.018056392669677734, 0.0191953182220459, 0.020334243774414062, 0.021473169326782227, 0.02261209487915039, 0.023751020431518555, 0.02488994598388672, 0.026028871536254883, 0.027167797088623047, 0.02830672264099121, 0.029445648193359375, 0.03058457374572754, 0.0317234992980957, 0.03286242485046387, 0.03400135040283203, 0.035140275955200195, 0.03627920150756836, 0.03741812705993652, 0.03855705261230469, 0.03969597816467285, 0.040834903717041016, 0.04197382926940918, 0.043112754821777344, 0.04425168037414551, 0.04539060592651367, 0.046529531478881836, 0.04766845703125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 6.0, 11.0, 13.0, 39.0, 86.0, 142.0, 222.0, 218.0, 124.0, 57.0, 37.0, 20.0, 15.0, 5.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.5880122184753418, -0.5751349329948425, -0.5622576475143433, -0.549380362033844, -0.5365030765533447, -0.5236257910728455, -0.5107485055923462, -0.4978712499141693, -0.48499396443367004, -0.4721166789531708, -0.4592393934726715, -0.44636210799217224, -0.43348485231399536, -0.4206075668334961, -0.4077302813529968, -0.39485299587249756, -0.3819757103919983, -0.369098424911499, -0.35622113943099976, -0.3433438539505005, -0.3304665684700012, -0.31758928298950195, -0.3047120273113251, -0.2918347418308258, -0.27895745635032654, -0.26608017086982727, -0.253202885389328, -0.24032561480998993, -0.22744832932949066, -0.2145710438489914, -0.20169377326965332, -0.18881648778915405, -0.17593920230865479, -0.16306191682815552, -0.15018463134765625, -0.13730736076831818, -0.12443007528781891, -0.11155278980731964, -0.09867551177740097, -0.0857982337474823, -0.07292094826698303, -0.06004366651177406, -0.047166384756565094, -0.034289103001356125, -0.021411821246147156, -0.008534535765647888, 0.0043427422642707825, 0.017220020294189453, 0.03009730577468872, 0.04297458752989769, 0.05585186928510666, 0.06872914731502533, 0.0816064327955246, 0.09448371827602386, 0.10736099630594254, 0.1202382743358612, 0.13311555981636047, 0.14599284529685974, 0.158870130777359, 0.17174740135669708, 0.18462468683719635, 0.19750197231769562, 0.2103792428970337, 0.22325652837753296, 0.23613381385803223]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 2.0, 2.0, 6.0, 8.0, 6.0, 12.0, 12.0, 18.0, 18.0, 24.0, 20.0, 32.0, 35.0, 30.0, 37.0, 44.0, 32.0, 47.0, 39.0, 46.0, 47.0, 49.0, 39.0, 55.0, 44.0, 38.0, 37.0, 30.0, 23.0, 25.0, 27.0, 26.0, 20.0, 13.0, 13.0, 5.0, 11.0, 7.0, 5.0, 6.0, 4.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.14956510066986084, -0.1455327719449997, -0.14150044322013855, -0.1374681144952774, -0.13343578577041626, -0.12940345704555511, -0.12537112832069397, -0.12133880704641342, -0.11730647832155228, -0.11327414959669113, -0.10924182087182999, -0.10520949214696884, -0.1011771708726883, -0.09714484214782715, -0.093112513422966, -0.08908018469810486, -0.08504785597324371, -0.08101552724838257, -0.07698319852352142, -0.07295086979866028, -0.06891854107379913, -0.06488621234893799, -0.06085389107465744, -0.056821562349796295, -0.05278923362493515, -0.048756904900074005, -0.04472457617521286, -0.040692251175642014, -0.03665992245078087, -0.032627593725919724, -0.028595266863703728, -0.024562940001487732, -0.020530611276626587, -0.016498282551765442, -0.012465955689549446, -0.008433627896010876, -0.004401300102472305, -0.0003689713776111603, 0.0036633554846048355, 0.007695682346820831, 0.011728011071681976, 0.01576033979654312, 0.019792666658759117, 0.023824993520975113, 0.027857322245836258, 0.0318896509706974, 0.03592197597026825, 0.039954304695129395, 0.04398663341999054, 0.048018962144851685, 0.05205129086971283, 0.056083615869283676, 0.06011594459414482, 0.06414827704429626, 0.06818059831857681, 0.07221292704343796, 0.0762452557682991, 0.08027758449316025, 0.08430991321802139, 0.08834224194288254, 0.09237456321716309, 0.09640689194202423, 0.10043922066688538, 0.10447154939174652, 0.10850387811660767]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 6.0, 16.0, 15.0, 17.0, 21.0, 34.0, 43.0, 56.0, 82.0, 140.0, 189.0, 312.0, 566.0, 1001.0, 1900.0, 4430.0, 10986.0, 29467.0, 81418.0, 214833.0, 350994.0, 217962.0, 83789.0, 30119.0, 11163.0, 4460.0, 2006.0, 967.0, 600.0, 325.0, 210.0, 136.0, 82.0, 60.0, 45.0, 34.0, 22.0, 23.0, 10.0, 10.0, 3.0, 5.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037994384765625, -0.03670692443847656, -0.035419464111328125, -0.03413200378417969, -0.03284454345703125, -0.03155708312988281, -0.030269622802734375, -0.028982162475585938, -0.0276947021484375, -0.026407241821289062, -0.025119781494140625, -0.023832321166992188, -0.02254486083984375, -0.021257400512695312, -0.019969940185546875, -0.018682479858398438, -0.01739501953125, -0.016107559204101562, -0.014820098876953125, -0.013532638549804688, -0.01224517822265625, -0.010957717895507812, -0.009670257568359375, -0.008382797241210938, -0.0070953369140625, -0.0058078765869140625, -0.004520416259765625, -0.0032329559326171875, -0.00194549560546875, -0.0006580352783203125, 0.000629425048828125, 0.0019168853759765625, 0.003204345703125, 0.0044918060302734375, 0.005779266357421875, 0.0070667266845703125, 0.00835418701171875, 0.009641647338867188, 0.010929107666015625, 0.012216567993164062, 0.0135040283203125, 0.014791488647460938, 0.016078948974609375, 0.017366409301757812, 0.01865386962890625, 0.019941329956054688, 0.021228790283203125, 0.022516250610351562, 0.0238037109375, 0.025091171264648438, 0.026378631591796875, 0.027666091918945312, 0.02895355224609375, 0.030241012573242188, 0.031528472900390625, 0.03281593322753906, 0.0341033935546875, 0.03539085388183594, 0.036678314208984375, 0.03796577453613281, 0.03925323486328125, 0.04054069519042969, 0.041828155517578125, 0.04311561584472656, 0.044403076171875]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 3.0, 13.0, 26.0, 22.0, 32.0, 36.0, 53.0, 57.0, 72.0, 87.0, 100.0, 87.0, 85.0, 73.0, 83.0, 51.0, 37.0, 23.0, 15.0, 17.0, 16.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0300140380859375, -0.029153108596801758, -0.028292179107666016, -0.027431249618530273, -0.02657032012939453, -0.02570939064025879, -0.024848461151123047, -0.023987531661987305, -0.023126602172851562, -0.02226567268371582, -0.021404743194580078, -0.020543813705444336, -0.019682884216308594, -0.01882195472717285, -0.01796102523803711, -0.017100095748901367, -0.016239166259765625, -0.015378236770629883, -0.01451730728149414, -0.013656377792358398, -0.012795448303222656, -0.011934518814086914, -0.011073589324951172, -0.01021265983581543, -0.009351730346679688, -0.008490800857543945, -0.007629871368408203, -0.006768941879272461, -0.005908012390136719, -0.0050470829010009766, -0.004186153411865234, -0.003325223922729492, -0.00246429443359375, -0.0016033649444580078, -0.0007424354553222656, 0.00011849403381347656, 0.0009794235229492188, 0.001840353012084961, 0.002701282501220703, 0.0035622119903564453, 0.0044231414794921875, 0.00528407096862793, 0.006145000457763672, 0.007005929946899414, 0.007866859436035156, 0.008727788925170898, 0.00958871841430664, 0.010449647903442383, 0.011310577392578125, 0.012171506881713867, 0.01303243637084961, 0.013893365859985352, 0.014754295349121094, 0.015615224838256836, 0.016476154327392578, 0.01733708381652832, 0.018198013305664062, 0.019058942794799805, 0.019919872283935547, 0.02078080177307129, 0.02164173126220703, 0.022502660751342773, 0.023363590240478516, 0.024224519729614258, 0.02508544921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 8.0, 7.0, 16.0, 18.0, 29.0, 47.0, 64.0, 129.0, 199.0, 315.0, 644.0, 1079.0, 2238.0, 4488.0, 9439.0, 20743.0, 47411.0, 112622.0, 251870.0, 310085.0, 163223.0, 69088.0, 29462.0, 12920.0, 6053.0, 2906.0, 1515.0, 815.0, 454.0, 247.0, 147.0, 83.0, 61.0, 38.0, 21.0, 23.0, 8.0, 9.0, 6.0, 5.0, 4.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.033050537109375, -0.03195667266845703, -0.030862808227539062, -0.029768943786621094, -0.028675079345703125, -0.027581214904785156, -0.026487350463867188, -0.02539348602294922, -0.02429962158203125, -0.02320575714111328, -0.022111892700195312, -0.021018028259277344, -0.019924163818359375, -0.018830299377441406, -0.017736434936523438, -0.01664257049560547, -0.0155487060546875, -0.014454841613769531, -0.013360977172851562, -0.012267112731933594, -0.011173248291015625, -0.010079383850097656, -0.008985519409179688, -0.007891654968261719, -0.00679779052734375, -0.005703926086425781, -0.0046100616455078125, -0.0035161972045898438, -0.002422332763671875, -0.0013284683227539062, -0.0002346038818359375, 0.0008592605590820312, 0.001953125, 0.0030469894409179688, 0.0041408538818359375, 0.005234718322753906, 0.006328582763671875, 0.007422447204589844, 0.008516311645507812, 0.009610176086425781, 0.01070404052734375, 0.011797904968261719, 0.012891769409179688, 0.013985633850097656, 0.015079498291015625, 0.016173362731933594, 0.017267227172851562, 0.01836109161376953, 0.0194549560546875, 0.02054882049560547, 0.021642684936523438, 0.022736549377441406, 0.023830413818359375, 0.024924278259277344, 0.026018142700195312, 0.02711200714111328, 0.02820587158203125, 0.02929973602294922, 0.030393600463867188, 0.031487464904785156, 0.032581329345703125, 0.033675193786621094, 0.03476905822753906, 0.03586292266845703, 0.036956787109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 6.0, 5.0, 2.0, 9.0, 17.0, 14.0, 7.0, 19.0, 17.0, 19.0, 30.0, 21.0, 33.0, 46.0, 26.0, 40.0, 45.0, 37.0, 55.0, 53.0, 40.0, 46.0, 41.0, 40.0, 30.0, 43.0, 29.0, 30.0, 25.0, 33.0, 26.0, 15.0, 21.0, 21.0, 10.0, 9.0, 4.0, 6.0, 8.0, 3.0, 3.0, 3.0, 7.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.045989990234375, -0.044579505920410156, -0.04316902160644531, -0.04175853729248047, -0.040348052978515625, -0.03893756866455078, -0.03752708435058594, -0.036116600036621094, -0.03470611572265625, -0.033295631408691406, -0.03188514709472656, -0.03047466278076172, -0.029064178466796875, -0.02765369415283203, -0.026243209838867188, -0.024832725524902344, -0.0234222412109375, -0.022011756896972656, -0.020601272583007812, -0.01919078826904297, -0.017780303955078125, -0.01636981964111328, -0.014959335327148438, -0.013548851013183594, -0.01213836669921875, -0.010727882385253906, -0.009317398071289062, -0.007906913757324219, -0.006496429443359375, -0.005085945129394531, -0.0036754608154296875, -0.0022649765014648438, -0.0008544921875, 0.0005559921264648438, 0.0019664764404296875, 0.0033769607543945312, 0.004787445068359375, 0.006197929382324219, 0.0076084136962890625, 0.009018898010253906, 0.01042938232421875, 0.011839866638183594, 0.013250350952148438, 0.014660835266113281, 0.016071319580078125, 0.01748180389404297, 0.018892288208007812, 0.020302772521972656, 0.0217132568359375, 0.023123741149902344, 0.024534225463867188, 0.02594470977783203, 0.027355194091796875, 0.02876567840576172, 0.030176162719726562, 0.031586647033691406, 0.03299713134765625, 0.034407615661621094, 0.03581809997558594, 0.03722858428955078, 0.038639068603515625, 0.04004955291748047, 0.04146003723144531, 0.042870521545410156, 0.044281005859375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 7.0, 7.0, 14.0, 29.0, 41.0, 56.0, 94.0, 159.0, 260.0, 462.0, 786.0, 1591.0, 3137.0, 6885.0, 17812.0, 66723.0, 545574.0, 336090.0, 44133.0, 13571.0, 5499.0, 2653.0, 1292.0, 685.0, 410.0, 226.0, 126.0, 91.0, 52.0, 39.0, 21.0, 8.0, 5.0, 6.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.026702880859375, -0.02583789825439453, -0.024972915649414062, -0.024107933044433594, -0.023242950439453125, -0.022377967834472656, -0.021512985229492188, -0.02064800262451172, -0.01978302001953125, -0.01891803741455078, -0.018053054809570312, -0.017188072204589844, -0.016323089599609375, -0.015458106994628906, -0.014593124389648438, -0.013728141784667969, -0.0128631591796875, -0.011998176574707031, -0.011133193969726562, -0.010268211364746094, -0.009403228759765625, -0.008538246154785156, -0.0076732635498046875, -0.006808280944824219, -0.00594329833984375, -0.005078315734863281, -0.0042133331298828125, -0.0033483505249023438, -0.002483367919921875, -0.0016183853149414062, -0.0007534027099609375, 0.00011157989501953125, 0.0009765625, 0.0018415451049804688, 0.0027065277099609375, 0.0035715103149414062, 0.004436492919921875, 0.005301475524902344, 0.0061664581298828125, 0.007031440734863281, 0.00789642333984375, 0.008761405944824219, 0.009626388549804688, 0.010491371154785156, 0.011356353759765625, 0.012221336364746094, 0.013086318969726562, 0.013951301574707031, 0.0148162841796875, 0.01568126678466797, 0.016546249389648438, 0.017411231994628906, 0.018276214599609375, 0.019141197204589844, 0.020006179809570312, 0.02087116241455078, 0.02173614501953125, 0.02260112762451172, 0.023466110229492188, 0.024331092834472656, 0.025196075439453125, 0.026061058044433594, 0.026926040649414062, 0.02779102325439453, 0.028656005859375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 9.0, 14.0, 12.0, 12.0, 10.0, 19.0, 24.0, 25.0, 51.0, 48.0, 59.0, 76.0, 74.0, 92.0, 75.0, 66.0, 76.0, 52.0, 38.0, 32.0, 28.0, 26.0, 22.0, 14.0, 12.0, 5.0, 2.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.731250762939453e-05, -3.596208989620209e-05, -3.4611672163009644e-05, -3.32612544298172e-05, -3.1910836696624756e-05, -3.056041896343231e-05, -2.9210001230239868e-05, -2.7859583497047424e-05, -2.650916576385498e-05, -2.5158748030662537e-05, -2.3808330297470093e-05, -2.245791256427765e-05, -2.1107494831085205e-05, -1.975707709789276e-05, -1.8406659364700317e-05, -1.7056241631507874e-05, -1.570582389831543e-05, -1.4355406165122986e-05, -1.3004988431930542e-05, -1.1654570698738098e-05, -1.0304152965545654e-05, -8.95373523235321e-06, -7.603317499160767e-06, -6.252899765968323e-06, -4.902482032775879e-06, -3.552064299583435e-06, -2.201646566390991e-06, -8.512288331985474e-07, 4.991888999938965e-07, 1.8496066331863403e-06, 3.200024366378784e-06, 4.550442099571228e-06, 5.900859832763672e-06, 7.251277565956116e-06, 8.60169529914856e-06, 9.952113032341003e-06, 1.1302530765533447e-05, 1.2652948498725891e-05, 1.4003366231918335e-05, 1.535378396511078e-05, 1.6704201698303223e-05, 1.8054619431495667e-05, 1.940503716468811e-05, 2.0755454897880554e-05, 2.2105872631072998e-05, 2.3456290364265442e-05, 2.4806708097457886e-05, 2.615712583065033e-05, 2.7507543563842773e-05, 2.8857961297035217e-05, 3.020837903022766e-05, 3.1558796763420105e-05, 3.290921449661255e-05, 3.425963222980499e-05, 3.5610049962997437e-05, 3.696046769618988e-05, 3.8310885429382324e-05, 3.966130316257477e-05, 4.101172089576721e-05, 4.2362138628959656e-05, 4.37125563621521e-05, 4.5062974095344543e-05, 4.641339182853699e-05, 4.776380956172943e-05, 4.9114227294921875e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 5.0, 11.0, 15.0, 14.0, 20.0, 34.0, 29.0, 59.0, 77.0, 129.0, 180.0, 295.0, 540.0, 886.0, 1654.0, 3061.0, 5963.0, 13527.0, 40880.0, 228164.0, 582591.0, 122384.0, 27140.0, 10269.0, 4742.0, 2606.0, 1338.0, 729.0, 395.0, 282.0, 174.0, 117.0, 82.0, 48.0, 33.0, 24.0, 18.0, 14.0, 3.0, 11.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.024078369140625, -0.023377180099487305, -0.02267599105834961, -0.021974802017211914, -0.02127361297607422, -0.020572423934936523, -0.019871234893798828, -0.019170045852661133, -0.018468856811523438, -0.017767667770385742, -0.017066478729248047, -0.01636528968811035, -0.015664100646972656, -0.014962911605834961, -0.014261722564697266, -0.01356053352355957, -0.012859344482421875, -0.01215815544128418, -0.011456966400146484, -0.010755777359008789, -0.010054588317871094, -0.009353399276733398, -0.008652210235595703, -0.007951021194458008, -0.0072498321533203125, -0.006548643112182617, -0.005847454071044922, -0.0051462650299072266, -0.004445075988769531, -0.003743886947631836, -0.0030426979064941406, -0.0023415088653564453, -0.00164031982421875, -0.0009391307830810547, -0.00023794174194335938, 0.00046324729919433594, 0.0011644363403320312, 0.0018656253814697266, 0.002566814422607422, 0.003268003463745117, 0.0039691925048828125, 0.004670381546020508, 0.005371570587158203, 0.0060727596282958984, 0.006773948669433594, 0.007475137710571289, 0.008176326751708984, 0.00887751579284668, 0.009578704833984375, 0.01027989387512207, 0.010981082916259766, 0.011682271957397461, 0.012383460998535156, 0.013084650039672852, 0.013785839080810547, 0.014487028121948242, 0.015188217163085938, 0.015889406204223633, 0.016590595245361328, 0.017291784286499023, 0.01799297332763672, 0.018694162368774414, 0.01939535140991211, 0.020096540451049805, 0.0207977294921875]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 5.0, 3.0, 5.0, 9.0, 9.0, 17.0, 23.0, 24.0, 50.0, 57.0, 77.0, 127.0, 150.0, 144.0, 80.0, 58.0, 55.0, 43.0, 18.0, 13.0, 13.0, 3.0, 6.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0], "bins": [-0.0282135009765625, -0.027502775192260742, -0.026792049407958984, -0.026081323623657227, -0.02537059783935547, -0.02465987205505371, -0.023949146270751953, -0.023238420486450195, -0.022527694702148438, -0.02181696891784668, -0.021106243133544922, -0.020395517349243164, -0.019684791564941406, -0.01897406578063965, -0.01826333999633789, -0.017552614212036133, -0.016841888427734375, -0.016131162643432617, -0.01542043685913086, -0.014709711074829102, -0.013998985290527344, -0.013288259506225586, -0.012577533721923828, -0.01186680793762207, -0.011156082153320312, -0.010445356369018555, -0.009734630584716797, -0.009023904800415039, -0.008313179016113281, -0.0076024532318115234, -0.006891727447509766, -0.006181001663208008, -0.00547027587890625, -0.004759550094604492, -0.004048824310302734, -0.0033380985260009766, -0.0026273727416992188, -0.001916646957397461, -0.0012059211730957031, -0.0004951953887939453, 0.0002155303955078125, 0.0009262561798095703, 0.0016369819641113281, 0.002347707748413086, 0.0030584335327148438, 0.0037691593170166016, 0.004479885101318359, 0.005190610885620117, 0.005901336669921875, 0.006612062454223633, 0.007322788238525391, 0.008033514022827148, 0.008744239807128906, 0.009454965591430664, 0.010165691375732422, 0.01087641716003418, 0.011587142944335938, 0.012297868728637695, 0.013008594512939453, 0.013719320297241211, 0.014430046081542969, 0.015140771865844727, 0.015851497650146484, 0.016562223434448242, 0.01727294921875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 14.0, 14.0, 20.0, 36.0, 60.0, 126.0, 145.0, 204.0, 177.0, 102.0, 45.0, 29.0, 12.0, 7.0, 3.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5163941979408264, -0.5038917064666748, -0.4913892447948456, -0.47888678312301636, -0.46638432145118713, -0.4538818597793579, -0.4413793683052063, -0.4288769066333771, -0.41637444496154785, -0.40387198328971863, -0.391369491815567, -0.3788670301437378, -0.36636456847190857, -0.35386210680007935, -0.34135961532592773, -0.3288571536540985, -0.3163546919822693, -0.30385223031044006, -0.29134973883628845, -0.27884727716445923, -0.26634481549263, -0.2538423538208008, -0.24133986234664917, -0.22883740067481995, -0.21633490920066833, -0.20383243262767792, -0.1913299709558487, -0.17882749438285828, -0.16632503271102905, -0.15382255613803864, -0.14132007956504822, -0.128817617893219, -0.11631515622138977, -0.10381268709897995, -0.09131021797657013, -0.07880774140357971, -0.06630527973175049, -0.05380280315876007, -0.04130033403635025, -0.02879786491394043, -0.01629539579153061, -0.003792925737798214, 0.008709544315934181, 0.02121201530098915, 0.03371448442339897, 0.04621695727109909, 0.05871942639350891, 0.07122189551591873, 0.08372436463832855, 0.09622683376073837, 0.1087293028831482, 0.12123177945613861, 0.13373424112796783, 0.14623671770095825, 0.15873917937278748, 0.1712416559457779, 0.1837441325187683, 0.19624660909175873, 0.20874907076358795, 0.22125154733657837, 0.2337540090084076, 0.246256485581398, 0.2587589621543884, 0.27126142382621765, 0.2837638854980469]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 6.0, 5.0, 9.0, 13.0, 14.0, 17.0, 19.0, 27.0, 31.0, 25.0, 18.0, 27.0, 31.0, 44.0, 42.0, 39.0, 46.0, 42.0, 45.0, 43.0, 47.0, 47.0, 39.0, 42.0, 36.0, 40.0, 28.0, 26.0, 31.0, 26.0, 14.0, 11.0, 17.0, 11.0, 10.0, 13.0, 3.0, 9.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.14830946922302246, -0.14427319169044495, -0.14023689925670624, -0.13620062172412872, -0.13216432929039001, -0.1281280517578125, -0.12409176677465439, -0.12005548179149628, -0.11601919680833817, -0.11198291182518005, -0.10794662684202194, -0.10391034185886383, -0.09987406432628632, -0.09583777189254761, -0.09180149435997009, -0.08776520937681198, -0.08372892439365387, -0.07969263941049576, -0.07565635442733765, -0.07162006944417953, -0.06758378446102142, -0.06354750692844391, -0.0595112219452858, -0.055474936962127686, -0.051438651978969574, -0.04740236699581146, -0.04336608201265335, -0.03932980075478554, -0.035293515771627426, -0.031257230788469315, -0.027220947667956352, -0.02318466454744339, -0.01914837956428528, -0.015112095512449741, -0.011075811460614204, -0.0070395274087786674, -0.0030032433569431305, 0.001033041626214981, 0.005069324746727943, 0.009105607867240906, 0.013141892850399017, 0.01717817783355713, 0.02121446095407009, 0.025250744074583054, 0.029287029057741165, 0.03332331404089928, 0.03735959529876709, 0.0413958802819252, 0.04543216526508331, 0.049468450248241425, 0.053504735231399536, 0.05754101648926735, 0.06157730147242546, 0.06561358273029327, 0.06964986771345139, 0.0736861526966095, 0.07772243767976761, 0.08175872266292572, 0.08579500764608383, 0.08983129262924194, 0.09386757016181946, 0.09790386259555817, 0.10194014012813568, 0.10597642511129379, 0.1100127100944519]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 3.0, 1.0, 4.0, 3.0, 3.0, 6.0, 10.0, 5.0, 11.0, 13.0, 24.0, 28.0, 35.0, 56.0, 103.0, 232.0, 428.0, 889.0, 2100.0, 5769.0, 20888.0, 118417.0, 2623106.0, 1322120.0, 76322.0, 15798.0, 4586.0, 1804.0, 761.0, 318.0, 177.0, 95.0, 63.0, 35.0, 20.0, 18.0, 7.0, 1.0, 4.0, 5.0, 3.0, 7.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.059051513671875, -0.057358741760253906, -0.05566596984863281, -0.05397319793701172, -0.052280426025390625, -0.05058765411376953, -0.04889488220214844, -0.047202110290527344, -0.04550933837890625, -0.043816566467285156, -0.04212379455566406, -0.04043102264404297, -0.038738250732421875, -0.03704547882080078, -0.03535270690917969, -0.033659934997558594, -0.0319671630859375, -0.030274391174316406, -0.028581619262695312, -0.02688884735107422, -0.025196075439453125, -0.02350330352783203, -0.021810531616210938, -0.020117759704589844, -0.01842498779296875, -0.016732215881347656, -0.015039443969726562, -0.013346672058105469, -0.011653900146484375, -0.009961128234863281, -0.008268356323242188, -0.006575584411621094, -0.0048828125, -0.0031900405883789062, -0.0014972686767578125, 0.00019550323486328125, 0.001888275146484375, 0.0035810470581054688, 0.0052738189697265625, 0.006966590881347656, 0.00865936279296875, 0.010352134704589844, 0.012044906616210938, 0.013737678527832031, 0.015430450439453125, 0.01712322235107422, 0.018815994262695312, 0.020508766174316406, 0.0222015380859375, 0.023894309997558594, 0.025587081909179688, 0.02727985382080078, 0.028972625732421875, 0.03066539764404297, 0.03235816955566406, 0.034050941467285156, 0.03574371337890625, 0.037436485290527344, 0.03912925720214844, 0.04082202911376953, 0.042514801025390625, 0.04420757293701172, 0.04590034484863281, 0.047593116760253906, 0.049285888671875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 12.0, 17.0, 21.0, 29.0, 40.0, 45.0, 70.0, 69.0, 77.0, 81.0, 91.0, 94.0, 82.0, 68.0, 55.0, 36.0, 37.0, 18.0, 23.0, 8.0, 3.0, 6.0, 10.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02801513671875, -0.02719402313232422, -0.026372909545898438, -0.025551795959472656, -0.024730682373046875, -0.023909568786621094, -0.023088455200195312, -0.02226734161376953, -0.02144622802734375, -0.02062511444091797, -0.019804000854492188, -0.018982887268066406, -0.018161773681640625, -0.017340660095214844, -0.016519546508789062, -0.01569843292236328, -0.0148773193359375, -0.014056205749511719, -0.013235092163085938, -0.012413978576660156, -0.011592864990234375, -0.010771751403808594, -0.009950637817382812, -0.009129524230957031, -0.00830841064453125, -0.007487297058105469, -0.0066661834716796875, -0.005845069885253906, -0.005023956298828125, -0.004202842712402344, -0.0033817291259765625, -0.0025606155395507812, -0.001739501953125, -0.0009183883666992188, -9.72747802734375e-05, 0.0007238388061523438, 0.001544952392578125, 0.0023660659790039062, 0.0031871795654296875, 0.004008293151855469, 0.00482940673828125, 0.005650520324707031, 0.0064716339111328125, 0.007292747497558594, 0.008113861083984375, 0.008934974670410156, 0.009756088256835938, 0.010577201843261719, 0.0113983154296875, 0.012219429016113281, 0.013040542602539062, 0.013861656188964844, 0.014682769775390625, 0.015503883361816406, 0.016324996948242188, 0.01714611053466797, 0.01796722412109375, 0.01878833770751953, 0.019609451293945312, 0.020430564880371094, 0.021251678466796875, 0.022072792053222656, 0.022893905639648438, 0.02371501922607422, 0.0245361328125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 7.0, 5.0, 14.0, 19.0, 30.0, 35.0, 42.0, 73.0, 113.0, 134.0, 255.0, 399.0, 598.0, 1029.0, 1925.0, 3359.0, 6865.0, 15380.0, 39162.0, 128171.0, 863933.0, 2760871.0, 262753.0, 65462.0, 23211.0, 9703.0, 4736.0, 2475.0, 1355.0, 750.0, 465.0, 312.0, 227.0, 135.0, 90.0, 66.0, 39.0, 32.0, 16.0, 15.0, 10.0, 6.0, 4.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.039764404296875, -0.03860282897949219, -0.037441253662109375, -0.03627967834472656, -0.03511810302734375, -0.03395652770996094, -0.032794952392578125, -0.03163337707519531, -0.0304718017578125, -0.029310226440429688, -0.028148651123046875, -0.026987075805664062, -0.02582550048828125, -0.024663925170898438, -0.023502349853515625, -0.022340774536132812, -0.02117919921875, -0.020017623901367188, -0.018856048583984375, -0.017694473266601562, -0.01653289794921875, -0.015371322631835938, -0.014209747314453125, -0.013048171997070312, -0.0118865966796875, -0.010725021362304688, -0.009563446044921875, -0.008401870727539062, -0.00724029541015625, -0.0060787200927734375, -0.004917144775390625, -0.0037555694580078125, -0.002593994140625, -0.0014324188232421875, -0.000270843505859375, 0.0008907318115234375, 0.00205230712890625, 0.0032138824462890625, 0.004375457763671875, 0.0055370330810546875, 0.0066986083984375, 0.007860183715820312, 0.009021759033203125, 0.010183334350585938, 0.01134490966796875, 0.012506484985351562, 0.013668060302734375, 0.014829635620117188, 0.0159912109375, 0.017152786254882812, 0.018314361572265625, 0.019475936889648438, 0.02063751220703125, 0.021799087524414062, 0.022960662841796875, 0.024122238159179688, 0.0252838134765625, 0.026445388793945312, 0.027606964111328125, 0.028768539428710938, 0.02993011474609375, 0.031091690063476562, 0.032253265380859375, 0.03341484069824219, 0.034576416015625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 10.0, 5.0, 8.0, 11.0, 14.0, 21.0, 44.0, 58.0, 76.0, 108.0, 222.0, 516.0, 1096.0, 836.0, 401.0, 216.0, 139.0, 66.0, 62.0, 49.0, 30.0, 22.0, 18.0, 7.0, 12.0, 11.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04449462890625, -0.04295158386230469, -0.041408538818359375, -0.03986549377441406, -0.03832244873046875, -0.03677940368652344, -0.035236358642578125, -0.03369331359863281, -0.0321502685546875, -0.030607223510742188, -0.029064178466796875, -0.027521133422851562, -0.02597808837890625, -0.024435043334960938, -0.022891998291015625, -0.021348953247070312, -0.019805908203125, -0.018262863159179688, -0.016719818115234375, -0.015176773071289062, -0.01363372802734375, -0.012090682983398438, -0.010547637939453125, -0.009004592895507812, -0.0074615478515625, -0.0059185028076171875, -0.004375457763671875, -0.0028324127197265625, -0.00128936767578125, 0.0002536773681640625, 0.001796722412109375, 0.0033397674560546875, 0.0048828125, 0.0064258575439453125, 0.007968902587890625, 0.009511947631835938, 0.01105499267578125, 0.012598037719726562, 0.014141082763671875, 0.015684127807617188, 0.0172271728515625, 0.018770217895507812, 0.020313262939453125, 0.021856307983398438, 0.02339935302734375, 0.024942398071289062, 0.026485443115234375, 0.028028488159179688, 0.029571533203125, 0.031114578247070312, 0.032657623291015625, 0.03420066833496094, 0.03574371337890625, 0.03728675842285156, 0.038829803466796875, 0.04037284851074219, 0.0419158935546875, 0.04345893859863281, 0.045001983642578125, 0.04654502868652344, 0.04808807373046875, 0.04963111877441406, 0.051174163818359375, 0.05271720886230469, 0.05426025390625]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 5.0, 8.0, 24.0, 62.0, 191.0, 293.0, 239.0, 106.0, 46.0, 16.0, 7.0, 7.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6213767528533936, -0.5994256734848022, -0.5774745345115662, -0.5555234551429749, -0.5335723161697388, -0.5116212368011475, -0.4896700978279114, -0.46771901845932007, -0.445767879486084, -0.4238167703151703, -0.4018656611442566, -0.3799145519733429, -0.3579634428024292, -0.3360123336315155, -0.3140612244606018, -0.2921101450920105, -0.2701590359210968, -0.2482079267501831, -0.2262568175792694, -0.2043057084083557, -0.18235459923744202, -0.16040349006652832, -0.13845239579677582, -0.11650128662586212, -0.09455017745494843, -0.07259906828403473, -0.05064796283841133, -0.028696857392787933, -0.006745748221874237, 0.01520536094903946, 0.03715646266937256, 0.059107571840286255, 0.08105868101119995, 0.10300979018211365, 0.12496089935302734, 0.14691200852394104, 0.16886311769485474, 0.19081422686576843, 0.21276532113552094, 0.23471643030643463, 0.2566675543785095, 0.2786186635494232, 0.3005697727203369, 0.3225208818912506, 0.3444719910621643, 0.366423100233078, 0.3883742094039917, 0.410325288772583, 0.4322763979434967, 0.4542275071144104, 0.4761786162853241, 0.4981297254562378, 0.5200808048248291, 0.5420319437980652, 0.5639830231666565, 0.5859341621398926, 0.6078852415084839, 0.6298363208770752, 0.6517874598503113, 0.6737385392189026, 0.6956896781921387, 0.71764075756073, 0.7395918965339661, 0.7615429759025574, 0.7834941148757935]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 4.0, 4.0, 10.0, 10.0, 12.0, 7.0, 8.0, 17.0, 20.0, 18.0, 23.0, 26.0, 29.0, 28.0, 37.0, 37.0, 37.0, 30.0, 41.0, 52.0, 39.0, 42.0, 42.0, 42.0, 42.0, 34.0, 28.0, 39.0, 34.0, 31.0, 26.0, 31.0, 27.0, 12.0, 18.0, 17.0, 11.0, 4.0, 8.0, 7.0, 7.0, 7.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.14839178323745728, -0.14376282691955566, -0.13913385570049286, -0.13450489938259125, -0.12987592816352844, -0.12524697184562683, -0.12061800807714462, -0.11598904430866241, -0.1113600805401802, -0.106731116771698, -0.10210215300321579, -0.09747318923473358, -0.09284423291683197, -0.08821526169776917, -0.08358630537986755, -0.07895734161138535, -0.07432837784290314, -0.06969941407442093, -0.06507045030593872, -0.06044149026274681, -0.0558125264942646, -0.051183562725782394, -0.046554602682590485, -0.041925638914108276, -0.03729667514562607, -0.03266771137714386, -0.0280387494713068, -0.023409787565469742, -0.018780823796987534, -0.014151860028505325, -0.009522898122668266, -0.004893936216831207, -0.000264972448348999, 0.004363990388810635, 0.008992953225970268, 0.013621916063129902, 0.018250878900289536, 0.022879842668771744, 0.027508804574608803, 0.03213776648044586, 0.03676673024892807, 0.04139569401741028, 0.04602465778589249, 0.050653617829084396, 0.055282581597566605, 0.05991154536604881, 0.06454050540924072, 0.06916946917772293, 0.07379843294620514, 0.07842739671468735, 0.08305636048316956, 0.08768532425165176, 0.09231428802013397, 0.09694324433803558, 0.10157220810651779, 0.106201171875, 0.11083013564348221, 0.11545909941196442, 0.12008806318044662, 0.12471702694892883, 0.12934598326683044, 0.13397495448589325, 0.13860391080379486, 0.14323288202285767, 0.14786183834075928]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 9.0, 12.0, 23.0, 34.0, 42.0, 54.0, 109.0, 174.0, 280.0, 537.0, 1081.0, 2207.0, 5096.0, 11764.0, 30299.0, 81432.0, 217797.0, 360910.0, 209409.0, 78045.0, 28583.0, 11410.0, 4834.0, 2117.0, 1059.0, 499.0, 278.0, 172.0, 101.0, 54.0, 38.0, 29.0, 21.0, 16.0, 10.0, 5.0, 6.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0457763671875, -0.04436683654785156, -0.042957305908203125, -0.04154777526855469, -0.04013824462890625, -0.03872871398925781, -0.037319183349609375, -0.03590965270996094, -0.0345001220703125, -0.03309059143066406, -0.031681060791015625, -0.030271530151367188, -0.02886199951171875, -0.027452468872070312, -0.026042938232421875, -0.024633407592773438, -0.023223876953125, -0.021814346313476562, -0.020404815673828125, -0.018995285034179688, -0.01758575439453125, -0.016176223754882812, -0.014766693115234375, -0.013357162475585938, -0.0119476318359375, -0.010538101196289062, -0.009128570556640625, -0.0077190399169921875, -0.00630950927734375, -0.0048999786376953125, -0.003490447998046875, -0.0020809173583984375, -0.00067138671875, 0.0007381439208984375, 0.002147674560546875, 0.0035572052001953125, 0.00496673583984375, 0.0063762664794921875, 0.007785797119140625, 0.009195327758789062, 0.0106048583984375, 0.012014389038085938, 0.013423919677734375, 0.014833450317382812, 0.01624298095703125, 0.017652511596679688, 0.019062042236328125, 0.020471572875976562, 0.021881103515625, 0.023290634155273438, 0.024700164794921875, 0.026109695434570312, 0.02751922607421875, 0.028928756713867188, 0.030338287353515625, 0.03174781799316406, 0.0331573486328125, 0.03456687927246094, 0.035976409912109375, 0.03738594055175781, 0.03879547119140625, 0.04020500183105469, 0.041614532470703125, 0.04302406311035156, 0.04443359375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 8.0, 11.0, 30.0, 22.0, 24.0, 23.0, 38.0, 50.0, 59.0, 67.0, 70.0, 81.0, 78.0, 75.0, 58.0, 69.0, 55.0, 40.0, 38.0, 22.0, 23.0, 19.0, 8.0, 10.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0297393798828125, -0.028862714767456055, -0.02798604965209961, -0.027109384536743164, -0.02623271942138672, -0.025356054306030273, -0.024479389190673828, -0.023602724075317383, -0.022726058959960938, -0.021849393844604492, -0.020972728729248047, -0.0200960636138916, -0.019219398498535156, -0.01834273338317871, -0.017466068267822266, -0.01658940315246582, -0.015712738037109375, -0.01483607292175293, -0.013959407806396484, -0.013082742691040039, -0.012206077575683594, -0.011329412460327148, -0.010452747344970703, -0.009576082229614258, -0.008699417114257812, -0.007822751998901367, -0.006946086883544922, -0.0060694217681884766, -0.005192756652832031, -0.004316091537475586, -0.0034394264221191406, -0.0025627613067626953, -0.00168609619140625, -0.0008094310760498047, 6.723403930664062e-05, 0.0009438991546630859, 0.0018205642700195312, 0.0026972293853759766, 0.003573894500732422, 0.004450559616088867, 0.0053272247314453125, 0.006203889846801758, 0.007080554962158203, 0.007957220077514648, 0.008833885192871094, 0.009710550308227539, 0.010587215423583984, 0.01146388053894043, 0.012340545654296875, 0.01321721076965332, 0.014093875885009766, 0.014970541000366211, 0.015847206115722656, 0.0167238712310791, 0.017600536346435547, 0.018477201461791992, 0.019353866577148438, 0.020230531692504883, 0.021107196807861328, 0.021983861923217773, 0.02286052703857422, 0.023737192153930664, 0.02461385726928711, 0.025490522384643555, 0.0263671875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 10.0, 13.0, 13.0, 27.0, 45.0, 50.0, 76.0, 148.0, 251.0, 422.0, 748.0, 1251.0, 2399.0, 4937.0, 10298.0, 23436.0, 58591.0, 161400.0, 390717.0, 243671.0, 88304.0, 33674.0, 14338.0, 6455.0, 3250.0, 1716.0, 999.0, 510.0, 316.0, 206.0, 84.0, 63.0, 49.0, 22.0, 15.0, 12.0, 10.0, 4.0, 4.0, 7.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0494384765625, -0.04797172546386719, -0.046504974365234375, -0.04503822326660156, -0.04357147216796875, -0.04210472106933594, -0.040637969970703125, -0.03917121887207031, -0.0377044677734375, -0.03623771667480469, -0.034770965576171875, -0.03330421447753906, -0.03183746337890625, -0.030370712280273438, -0.028903961181640625, -0.027437210083007812, -0.025970458984375, -0.024503707885742188, -0.023036956787109375, -0.021570205688476562, -0.02010345458984375, -0.018636703491210938, -0.017169952392578125, -0.015703201293945312, -0.0142364501953125, -0.012769699096679688, -0.011302947998046875, -0.009836196899414062, -0.00836944580078125, -0.0069026947021484375, -0.005435943603515625, -0.0039691925048828125, -0.00250244140625, -0.0010356903076171875, 0.000431060791015625, 0.0018978118896484375, 0.00336456298828125, 0.0048313140869140625, 0.006298065185546875, 0.0077648162841796875, 0.0092315673828125, 0.010698318481445312, 0.012165069580078125, 0.013631820678710938, 0.01509857177734375, 0.016565322875976562, 0.018032073974609375, 0.019498825073242188, 0.020965576171875, 0.022432327270507812, 0.023899078369140625, 0.025365829467773438, 0.02683258056640625, 0.028299331665039062, 0.029766082763671875, 0.031232833862304688, 0.0326995849609375, 0.03416633605957031, 0.035633087158203125, 0.03709983825683594, 0.03856658935546875, 0.04003334045410156, 0.041500091552734375, 0.04296684265136719, 0.04443359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 3.0, 4.0, 3.0, 6.0, 3.0, 5.0, 7.0, 12.0, 13.0, 17.0, 23.0, 20.0, 34.0, 24.0, 24.0, 45.0, 53.0, 54.0, 73.0, 61.0, 59.0, 52.0, 50.0, 63.0, 44.0, 51.0, 28.0, 25.0, 32.0, 34.0, 25.0, 19.0, 12.0, 9.0, 9.0, 2.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06756591796875, -0.06525611877441406, -0.06294631958007812, -0.06063652038574219, -0.05832672119140625, -0.05601692199707031, -0.053707122802734375, -0.05139732360839844, -0.0490875244140625, -0.04677772521972656, -0.044467926025390625, -0.04215812683105469, -0.03984832763671875, -0.03753852844238281, -0.035228729248046875, -0.03291893005371094, -0.030609130859375, -0.028299331665039062, -0.025989532470703125, -0.023679733276367188, -0.02136993408203125, -0.019060134887695312, -0.016750335693359375, -0.014440536499023438, -0.0121307373046875, -0.009820938110351562, -0.007511138916015625, -0.0052013397216796875, -0.00289154052734375, -0.0005817413330078125, 0.001728057861328125, 0.0040378570556640625, 0.00634765625, 0.008657455444335938, 0.010967254638671875, 0.013277053833007812, 0.01558685302734375, 0.017896652221679688, 0.020206451416015625, 0.022516250610351562, 0.0248260498046875, 0.027135848999023438, 0.029445648193359375, 0.03175544738769531, 0.03406524658203125, 0.03637504577636719, 0.038684844970703125, 0.04099464416503906, 0.043304443359375, 0.04561424255371094, 0.047924041748046875, 0.05023384094238281, 0.05254364013671875, 0.05485343933105469, 0.057163238525390625, 0.05947303771972656, 0.0617828369140625, 0.06409263610839844, 0.06640243530273438, 0.06871223449707031, 0.07102203369140625, 0.07333183288574219, 0.07564163208007812, 0.07795143127441406, 0.08026123046875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 5.0, 4.0, 3.0, 2.0, 5.0, 12.0, 18.0, 25.0, 40.0, 50.0, 62.0, 107.0, 149.0, 199.0, 358.0, 518.0, 783.0, 1297.0, 2087.0, 3537.0, 6047.0, 11597.0, 23131.0, 57056.0, 193953.0, 472340.0, 174459.0, 53276.0, 21790.0, 10854.0, 5859.0, 3453.0, 2010.0, 1179.0, 759.0, 514.0, 312.0, 233.0, 139.0, 100.0, 72.0, 54.0, 35.0, 19.0, 20.0, 5.0, 8.0, 5.0, 5.0, 8.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0], "bins": [-0.01448822021484375, -0.014041900634765625, -0.0135955810546875, -0.013149261474609375, -0.01270294189453125, -0.012256622314453125, -0.011810302734375, -0.011363983154296875, -0.01091766357421875, -0.010471343994140625, -0.0100250244140625, -0.009578704833984375, -0.00913238525390625, -0.008686065673828125, -0.00823974609375, -0.007793426513671875, -0.00734710693359375, -0.006900787353515625, -0.0064544677734375, -0.006008148193359375, -0.00556182861328125, -0.005115509033203125, -0.004669189453125, -0.004222869873046875, -0.00377655029296875, -0.003330230712890625, -0.0028839111328125, -0.002437591552734375, -0.00199127197265625, -0.001544952392578125, -0.0010986328125, -0.000652313232421875, -0.00020599365234375, 0.000240325927734375, 0.0006866455078125, 0.001132965087890625, 0.00157928466796875, 0.002025604248046875, 0.002471923828125, 0.002918243408203125, 0.00336456298828125, 0.003810882568359375, 0.0042572021484375, 0.004703521728515625, 0.00514984130859375, 0.005596160888671875, 0.00604248046875, 0.006488800048828125, 0.00693511962890625, 0.007381439208984375, 0.0078277587890625, 0.008274078369140625, 0.00872039794921875, 0.009166717529296875, 0.009613037109375, 0.010059356689453125, 0.01050567626953125, 0.010951995849609375, 0.0113983154296875, 0.011844635009765625, 0.01229095458984375, 0.012737274169921875, 0.01318359375, 0.013629913330078125, 0.01407623291015625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 4.0, 2.0, 8.0, 8.0, 5.0, 10.0, 10.0, 14.0, 16.0, 33.0, 38.0, 49.0, 52.0, 72.0, 72.0, 74.0, 78.0, 82.0, 75.0, 49.0, 57.0, 35.0, 40.0, 26.0, 12.0, 11.0, 12.0, 7.0, 10.0, 6.0, 5.0, 4.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.838539123535156e-05, -3.711320459842682e-05, -3.5841017961502075e-05, -3.456883132457733e-05, -3.329664468765259e-05, -3.2024458050727844e-05, -3.07522714138031e-05, -2.9480084776878357e-05, -2.8207898139953613e-05, -2.693571150302887e-05, -2.5663524866104126e-05, -2.4391338229179382e-05, -2.311915159225464e-05, -2.1846964955329895e-05, -2.057477831840515e-05, -1.9302591681480408e-05, -1.8030405044555664e-05, -1.675821840763092e-05, -1.5486031770706177e-05, -1.4213845133781433e-05, -1.294165849685669e-05, -1.1669471859931946e-05, -1.0397285223007202e-05, -9.125098586082458e-06, -7.852911949157715e-06, -6.580725312232971e-06, -5.3085386753082275e-06, -4.036352038383484e-06, -2.7641654014587402e-06, -1.4919787645339966e-06, -2.1979212760925293e-07, 1.0523945093154907e-06, 2.3245811462402344e-06, 3.596767783164978e-06, 4.868954420089722e-06, 6.141141057014465e-06, 7.413327693939209e-06, 8.685514330863953e-06, 9.957700967788696e-06, 1.122988760471344e-05, 1.2502074241638184e-05, 1.3774260878562927e-05, 1.5046447515487671e-05, 1.6318634152412415e-05, 1.7590820789337158e-05, 1.8863007426261902e-05, 2.0135194063186646e-05, 2.140738070011139e-05, 2.2679567337036133e-05, 2.3951753973960876e-05, 2.522394061088562e-05, 2.6496127247810364e-05, 2.7768313884735107e-05, 2.904050052165985e-05, 3.0312687158584595e-05, 3.158487379550934e-05, 3.285706043243408e-05, 3.4129247069358826e-05, 3.540143370628357e-05, 3.667362034320831e-05, 3.794580698013306e-05, 3.92179936170578e-05, 4.0490180253982544e-05, 4.176236689090729e-05, 4.303455352783203e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 17.0, 10.0, 9.0, 15.0, 24.0, 31.0, 56.0, 66.0, 118.0, 153.0, 241.0, 328.0, 477.0, 695.0, 1127.0, 1716.0, 2848.0, 4656.0, 8294.0, 15427.0, 31446.0, 70075.0, 175482.0, 372444.0, 205511.0, 81483.0, 35830.0, 17126.0, 9084.0, 5217.0, 3149.0, 1864.0, 1124.0, 801.0, 490.0, 344.0, 250.0, 159.0, 100.0, 82.0, 66.0, 42.0, 35.0, 16.0, 8.0, 9.0, 3.0, 4.0, 7.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00986480712890625, -0.009552478790283203, -0.009240150451660156, -0.00892782211303711, -0.008615493774414062, -0.008303165435791016, -0.007990837097167969, -0.007678508758544922, -0.007366180419921875, -0.007053852081298828, -0.006741523742675781, -0.006429195404052734, -0.0061168670654296875, -0.005804538726806641, -0.005492210388183594, -0.005179882049560547, -0.0048675537109375, -0.004555225372314453, -0.004242897033691406, -0.003930568695068359, -0.0036182403564453125, -0.0033059120178222656, -0.0029935836791992188, -0.002681255340576172, -0.002368927001953125, -0.002056598663330078, -0.0017442703247070312, -0.0014319419860839844, -0.0011196136474609375, -0.0008072853088378906, -0.0004949569702148438, -0.00018262863159179688, 0.00012969970703125, 0.0004420280456542969, 0.0007543563842773438, 0.0010666847229003906, 0.0013790130615234375, 0.0016913414001464844, 0.0020036697387695312, 0.002315998077392578, 0.002628326416015625, 0.002940654754638672, 0.0032529830932617188, 0.0035653114318847656, 0.0038776397705078125, 0.004189968109130859, 0.004502296447753906, 0.004814624786376953, 0.005126953125, 0.005439281463623047, 0.005751609802246094, 0.006063938140869141, 0.0063762664794921875, 0.006688594818115234, 0.007000923156738281, 0.007313251495361328, 0.007625579833984375, 0.007937908172607422, 0.008250236511230469, 0.008562564849853516, 0.008874893188476562, 0.00918722152709961, 0.009499549865722656, 0.009811878204345703, 0.01012420654296875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 4.0, 1.0, 1.0, 5.0, 8.0, 11.0, 6.0, 15.0, 13.0, 16.0, 29.0, 37.0, 42.0, 64.0, 86.0, 68.0, 87.0, 103.0, 77.0, 61.0, 56.0, 46.0, 33.0, 22.0, 30.0, 13.0, 17.0, 9.0, 6.0, 7.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01485443115234375, -0.014367938041687012, -0.013881444931030273, -0.013394951820373535, -0.012908458709716797, -0.012421965599060059, -0.01193547248840332, -0.011448979377746582, -0.010962486267089844, -0.010475993156433105, -0.009989500045776367, -0.009503006935119629, -0.00901651382446289, -0.008530020713806152, -0.008043527603149414, -0.007557034492492676, -0.0070705413818359375, -0.006584048271179199, -0.006097555160522461, -0.005611062049865723, -0.005124568939208984, -0.004638075828552246, -0.004151582717895508, -0.0036650896072387695, -0.0031785964965820312, -0.002692103385925293, -0.0022056102752685547, -0.0017191171646118164, -0.0012326240539550781, -0.0007461309432983398, -0.00025963783264160156, 0.00022685527801513672, 0.000713348388671875, 0.0011998414993286133, 0.0016863346099853516, 0.00217282772064209, 0.002659320831298828, 0.0031458139419555664, 0.0036323070526123047, 0.004118800163269043, 0.004605293273925781, 0.0050917863845825195, 0.005578279495239258, 0.006064772605895996, 0.006551265716552734, 0.007037758827209473, 0.007524251937866211, 0.00801074504852295, 0.008497238159179688, 0.008983731269836426, 0.009470224380493164, 0.009956717491149902, 0.01044321060180664, 0.010929703712463379, 0.011416196823120117, 0.011902689933776855, 0.012389183044433594, 0.012875676155090332, 0.01336216926574707, 0.013848662376403809, 0.014335155487060547, 0.014821648597717285, 0.015308141708374023, 0.01579463481903076, 0.0162811279296875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 12.0, 23.0, 48.0, 106.0, 204.0, 247.0, 175.0, 92.0, 48.0, 19.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8503850102424622, -0.8307543396949768, -0.8111236095428467, -0.7914929389953613, -0.771862268447876, -0.7522315382957458, -0.7326008677482605, -0.7129701375961304, -0.693339467048645, -0.6737087965011597, -0.6540780663490295, -0.6344473958015442, -0.6148166656494141, -0.5951859951019287, -0.5755553245544434, -0.555924654006958, -0.5362939238548279, -0.5166632533073425, -0.4970325231552124, -0.47740185260772705, -0.4577711522579193, -0.4381404519081116, -0.4185097813606262, -0.3988790810108185, -0.37924838066101074, -0.359617680311203, -0.33998697996139526, -0.3203563094139099, -0.3007256090641022, -0.28109490871429443, -0.2614642381668091, -0.24183353781700134, -0.22220280766487122, -0.20257210731506348, -0.18294142186641693, -0.16331073641777039, -0.14368003606796265, -0.1240493431687355, -0.10441865026950836, -0.08478796482086182, -0.06515726447105408, -0.045526571571826935, -0.025895878672599792, -0.00626518577337265, 0.013365507125854492, 0.032996200025081635, 0.05262689292430878, 0.07225757837295532, 0.09188827872276306, 0.1115189716219902, 0.13114966452121735, 0.1507803499698639, 0.17041105031967163, 0.19004175066947937, 0.20967243611812592, 0.22930312156677246, 0.2489338219165802, 0.26856452226638794, 0.2881951928138733, 0.30782589316368103, 0.32745659351348877, 0.3470872938632965, 0.36671799421310425, 0.3863486647605896, 0.40597936511039734]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 11.0, 11.0, 15.0, 12.0, 19.0, 20.0, 22.0, 22.0, 25.0, 26.0, 35.0, 22.0, 33.0, 38.0, 50.0, 37.0, 52.0, 49.0, 49.0, 47.0, 39.0, 43.0, 42.0, 46.0, 31.0, 28.0, 32.0, 20.0, 16.0, 16.0, 14.0, 15.0, 10.0, 3.0, 14.0, 7.0, 5.0, 7.0, 7.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.20375710725784302, -0.1981145590543747, -0.19247199594974518, -0.18682944774627686, -0.18118689954280853, -0.1755443513393402, -0.1699017882347107, -0.16425924003124237, -0.15861669182777405, -0.15297414362430573, -0.1473315805196762, -0.14168903231620789, -0.13604648411273956, -0.13040393590927124, -0.12476137280464172, -0.1191188246011734, -0.11347626149654388, -0.10783370584249496, -0.10219115763902664, -0.09654860198497772, -0.0909060537815094, -0.08526349812746048, -0.07962094247341156, -0.07397839426994324, -0.06833583861589432, -0.0626932829618454, -0.057050734758377075, -0.051408179104328156, -0.045765627175569534, -0.04012307524681091, -0.03448051959276199, -0.028837967664003372, -0.02319541573524475, -0.01755286380648613, -0.01191031001508236, -0.006267756223678589, -0.0006252042949199677, 0.0050173476338386536, 0.010659903287887573, 0.016302455216646194, 0.021945007145404816, 0.027587559074163437, 0.03323011100292206, 0.03887266665697098, 0.0445152185857296, 0.05015777051448822, 0.05580032616853714, 0.06144287809729576, 0.06708543002605438, 0.0727279856801033, 0.07837053388357162, 0.08401308953762054, 0.08965563774108887, 0.09529819339513779, 0.1009407490491867, 0.10658329725265503, 0.11222585290670395, 0.11786840856075287, 0.12351095676422119, 0.1291535198688507, 0.13479606807231903, 0.14043861627578735, 0.14608117938041687, 0.1517237275838852, 0.15736627578735352]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 5.0, 4.0, 5.0, 9.0, 17.0, 15.0, 26.0, 39.0, 48.0, 78.0, 109.0, 174.0, 286.0, 501.0, 1048.0, 2399.0, 7079.0, 25626.0, 130010.0, 1164291.0, 2472994.0, 320450.0, 50909.0, 11939.0, 3637.0, 1327.0, 570.0, 277.0, 146.0, 78.0, 66.0, 26.0, 28.0, 11.0, 15.0, 11.0, 10.0, 2.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.07891845703125, -0.07654285430908203, -0.07416725158691406, -0.0717916488647461, -0.06941604614257812, -0.06704044342041016, -0.06466484069824219, -0.06228923797607422, -0.05991363525390625, -0.05753803253173828, -0.05516242980957031, -0.052786827087402344, -0.050411224365234375, -0.048035621643066406, -0.04566001892089844, -0.04328441619873047, -0.0409088134765625, -0.03853321075439453, -0.03615760803222656, -0.033782005310058594, -0.031406402587890625, -0.029030799865722656, -0.026655197143554688, -0.02427959442138672, -0.02190399169921875, -0.01952838897705078, -0.017152786254882812, -0.014777183532714844, -0.012401580810546875, -0.010025978088378906, -0.0076503753662109375, -0.005274772644042969, -0.002899169921875, -0.0005235671997070312, 0.0018520355224609375, 0.004227638244628906, 0.006603240966796875, 0.008978843688964844, 0.011354446411132812, 0.013730049133300781, 0.01610565185546875, 0.01848125457763672, 0.020856857299804688, 0.023232460021972656, 0.025608062744140625, 0.027983665466308594, 0.030359268188476562, 0.03273487091064453, 0.0351104736328125, 0.03748607635498047, 0.03986167907714844, 0.042237281799316406, 0.044612884521484375, 0.046988487243652344, 0.04936408996582031, 0.05173969268798828, 0.05411529541015625, 0.05649089813232422, 0.05886650085449219, 0.061242103576660156, 0.06361770629882812, 0.0659933090209961, 0.06836891174316406, 0.07074451446533203, 0.0731201171875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 8.0, 17.0, 7.0, 19.0, 29.0, 27.0, 48.0, 59.0, 61.0, 51.0, 83.0, 86.0, 84.0, 72.0, 74.0, 59.0, 57.0, 49.0, 24.0, 23.0, 15.0, 20.0, 8.0, 6.0, 5.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.030609130859375, -0.02972888946533203, -0.028848648071289062, -0.027968406677246094, -0.027088165283203125, -0.026207923889160156, -0.025327682495117188, -0.02444744110107422, -0.02356719970703125, -0.02268695831298828, -0.021806716918945312, -0.020926475524902344, -0.020046234130859375, -0.019165992736816406, -0.018285751342773438, -0.01740550994873047, -0.0165252685546875, -0.01564502716064453, -0.014764785766601562, -0.013884544372558594, -0.013004302978515625, -0.012124061584472656, -0.011243820190429688, -0.010363578796386719, -0.00948333740234375, -0.008603096008300781, -0.0077228546142578125, -0.006842613220214844, -0.005962371826171875, -0.005082130432128906, -0.0042018890380859375, -0.0033216476440429688, -0.00244140625, -0.0015611648559570312, -0.0006809234619140625, 0.00019931793212890625, 0.001079559326171875, 0.0019598007202148438, 0.0028400421142578125, 0.0037202835083007812, 0.00460052490234375, 0.005480766296386719, 0.0063610076904296875, 0.007241249084472656, 0.008121490478515625, 0.009001731872558594, 0.009881973266601562, 0.010762214660644531, 0.0116424560546875, 0.012522697448730469, 0.013402938842773438, 0.014283180236816406, 0.015163421630859375, 0.016043663024902344, 0.016923904418945312, 0.01780414581298828, 0.01868438720703125, 0.01956462860107422, 0.020444869995117188, 0.021325111389160156, 0.022205352783203125, 0.023085594177246094, 0.023965835571289062, 0.02484607696533203, 0.025726318359375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 3.0, 7.0, 11.0, 12.0, 31.0, 21.0, 39.0, 47.0, 63.0, 90.0, 132.0, 199.0, 326.0, 555.0, 963.0, 1637.0, 3259.0, 7009.0, 17408.0, 54279.0, 243772.0, 1968113.0, 1610289.0, 208121.0, 48820.0, 15794.0, 6457.0, 3041.0, 1504.0, 868.0, 503.0, 318.0, 198.0, 113.0, 77.0, 62.0, 48.0, 34.0, 14.0, 13.0, 6.0, 7.0, 5.0, 6.0, 3.0, 3.0, 4.0], "bins": [-0.07318115234375, -0.07130241394042969, -0.06942367553710938, -0.06754493713378906, -0.06566619873046875, -0.06378746032714844, -0.061908721923828125, -0.06002998352050781, -0.0581512451171875, -0.05627250671386719, -0.054393768310546875, -0.05251502990722656, -0.05063629150390625, -0.04875755310058594, -0.046878814697265625, -0.04500007629394531, -0.043121337890625, -0.04124259948730469, -0.039363861083984375, -0.03748512268066406, -0.03560638427734375, -0.03372764587402344, -0.031848907470703125, -0.029970169067382812, -0.0280914306640625, -0.026212692260742188, -0.024333953857421875, -0.022455215454101562, -0.02057647705078125, -0.018697738647460938, -0.016819000244140625, -0.014940261840820312, -0.0130615234375, -0.011182785034179688, -0.009304046630859375, -0.0074253082275390625, -0.00554656982421875, -0.0036678314208984375, -0.001789093017578125, 8.96453857421875e-05, 0.0019683837890625, 0.0038471221923828125, 0.005725860595703125, 0.0076045989990234375, 0.00948333740234375, 0.011362075805664062, 0.013240814208984375, 0.015119552612304688, 0.016998291015625, 0.018877029418945312, 0.020755767822265625, 0.022634506225585938, 0.02451324462890625, 0.026391983032226562, 0.028270721435546875, 0.030149459838867188, 0.0320281982421875, 0.03390693664550781, 0.035785675048828125, 0.03766441345214844, 0.03954315185546875, 0.04142189025878906, 0.043300628662109375, 0.04517936706542969, 0.04705810546875]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 7.0, 5.0, 8.0, 12.0, 11.0, 23.0, 20.0, 35.0, 42.0, 85.0, 112.0, 158.0, 216.0, 369.0, 477.0, 615.0, 574.0, 415.0, 288.0, 198.0, 128.0, 94.0, 65.0, 30.0, 39.0, 14.0, 11.0, 9.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0888671875, -0.08607673645019531, -0.08328628540039062, -0.08049583435058594, -0.07770538330078125, -0.07491493225097656, -0.07212448120117188, -0.06933403015136719, -0.0665435791015625, -0.06375312805175781, -0.060962677001953125, -0.05817222595214844, -0.05538177490234375, -0.05259132385253906, -0.049800872802734375, -0.04701042175292969, -0.044219970703125, -0.04142951965332031, -0.038639068603515625, -0.03584861755371094, -0.03305816650390625, -0.030267715454101562, -0.027477264404296875, -0.024686813354492188, -0.0218963623046875, -0.019105911254882812, -0.016315460205078125, -0.013525009155273438, -0.01073455810546875, -0.007944107055664062, -0.005153656005859375, -0.0023632049560546875, 0.00042724609375, 0.0032176971435546875, 0.006008148193359375, 0.008798599243164062, 0.01158905029296875, 0.014379501342773438, 0.017169952392578125, 0.019960403442382812, 0.0227508544921875, 0.025541305541992188, 0.028331756591796875, 0.031122207641601562, 0.03391265869140625, 0.03670310974121094, 0.039493560791015625, 0.04228401184082031, 0.045074462890625, 0.04786491394042969, 0.050655364990234375, 0.05344581604003906, 0.05623626708984375, 0.05902671813964844, 0.061817169189453125, 0.06460762023925781, 0.0673980712890625, 0.07018852233886719, 0.07297897338867188, 0.07576942443847656, 0.07855987548828125, 0.08135032653808594, 0.08414077758789062, 0.08693122863769531, 0.0897216796875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 0.0, 2.0, 3.0, 9.0, 4.0, 9.0, 4.0, 17.0, 10.0, 31.0, 63.0, 77.0, 143.0, 195.0, 154.0, 117.0, 65.0, 39.0, 20.0, 13.0, 5.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5112895965576172, -1.4646813869476318, -1.418073058128357, -1.3714648485183716, -1.3248566389083862, -1.2782483100891113, -1.231640100479126, -1.1850318908691406, -1.1384235620498657, -1.0918153524398804, -1.0452070236206055, -0.9985988140106201, -0.95199054479599, -0.9053822755813599, -0.8587740659713745, -0.8121657967567444, -0.765557587146759, -0.7189493179321289, -0.6723411083221436, -0.6257328391075134, -0.5791245698928833, -0.532516360282898, -0.4859080910682678, -0.4392998218536377, -0.39269158244132996, -0.3460833430290222, -0.2994750738143921, -0.25286683440208435, -0.20625858008861542, -0.15965032577514648, -0.11304208636283875, -0.06643381714820862, -0.01982557773590088, 0.026782672852277756, 0.07339092344045639, 0.11999917030334473, 0.16660742461681366, 0.2132156789302826, 0.25982391834259033, 0.30643218755722046, 0.3530404269695282, 0.39964866638183594, 0.44625693559646606, 0.4928651750087738, 0.5394734144210815, 0.5860816836357117, 0.6326899528503418, 0.6792981624603271, 0.7259064316749573, 0.7725147008895874, 0.8191229104995728, 0.8657311797142029, 0.912339448928833, 0.9589476585388184, 1.0055558681488037, 1.0521641969680786, 1.098772406578064, 1.1453806161880493, 1.1919889450073242, 1.2385971546173096, 1.285205364227295, 1.3318136930465698, 1.3784219026565552, 1.42503023147583, 1.4716384410858154]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 4.0, 4.0, 5.0, 8.0, 9.0, 16.0, 12.0, 20.0, 18.0, 27.0, 20.0, 42.0, 37.0, 37.0, 47.0, 36.0, 51.0, 47.0, 53.0, 60.0, 48.0, 53.0, 42.0, 42.0, 37.0, 43.0, 43.0, 23.0, 25.0, 20.0, 7.0, 11.0, 9.0, 10.0, 7.0, 5.0, 5.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.7311837077140808, -0.709852397441864, -0.6885210871696472, -0.6671898365020752, -0.6458585262298584, -0.6245272159576416, -0.6031959056854248, -0.581864595413208, -0.5605332851409912, -0.5392019748687744, -0.5178706645965576, -0.4965393841266632, -0.4752081036567688, -0.453876793384552, -0.4325454831123352, -0.4112141728401184, -0.3898829221725464, -0.3685516119003296, -0.3472203314304352, -0.3258890211582184, -0.304557740688324, -0.2832264304161072, -0.2618951201438904, -0.24056382477283478, -0.21923252940177917, -0.19790123403072357, -0.17656993865966797, -0.15523862838745117, -0.13390733301639557, -0.11257603764533997, -0.09124472737312317, -0.06991343200206757, -0.04858219623565674, -0.027250897139310837, -0.005919598042964935, 0.015411704778671265, 0.03674300014972687, 0.05807429552078247, 0.07940560579299927, 0.10073690116405487, 0.12206819653511047, 0.14339949190616608, 0.16473078727722168, 0.18606209754943848, 0.20739339292049408, 0.22872468829154968, 0.2500559985637665, 0.2713872790336609, 0.2927185893058777, 0.3140498995780945, 0.3353811800479889, 0.3567124903202057, 0.3780437707901001, 0.3993750810623169, 0.4207063913345337, 0.4420377016067505, 0.4633689820766449, 0.4847002923488617, 0.5060315728187561, 0.5273628830909729, 0.5486941933631897, 0.5700254440307617, 0.5913567543029785, 0.6126880645751953, 0.6340193748474121]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 2.0, 11.0, 11.0, 12.0, 20.0, 28.0, 31.0, 59.0, 76.0, 108.0, 180.0, 261.0, 422.0, 767.0, 1141.0, 2044.0, 3597.0, 6721.0, 13598.0, 29668.0, 68375.0, 171617.0, 349458.0, 232430.0, 92371.0, 38830.0, 17592.0, 8572.0, 4423.0, 2440.0, 1362.0, 864.0, 529.0, 329.0, 231.0, 132.0, 83.0, 51.0, 29.0, 13.0, 24.0, 10.0, 11.0, 8.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048095703125, -0.04652738571166992, -0.044959068298339844, -0.043390750885009766, -0.04182243347167969, -0.04025411605834961, -0.03868579864501953, -0.03711748123168945, -0.035549163818359375, -0.0339808464050293, -0.03241252899169922, -0.03084421157836914, -0.029275894165039062, -0.027707576751708984, -0.026139259338378906, -0.024570941925048828, -0.02300262451171875, -0.021434307098388672, -0.019865989685058594, -0.018297672271728516, -0.016729354858398438, -0.01516103744506836, -0.013592720031738281, -0.012024402618408203, -0.010456085205078125, -0.008887767791748047, -0.007319450378417969, -0.005751132965087891, -0.0041828155517578125, -0.0026144981384277344, -0.0010461807250976562, 0.0005221366882324219, 0.0020904541015625, 0.003658771514892578, 0.005227088928222656, 0.006795406341552734, 0.008363723754882812, 0.00993204116821289, 0.011500358581542969, 0.013068675994873047, 0.014636993408203125, 0.016205310821533203, 0.01777362823486328, 0.01934194564819336, 0.020910263061523438, 0.022478580474853516, 0.024046897888183594, 0.025615215301513672, 0.02718353271484375, 0.028751850128173828, 0.030320167541503906, 0.031888484954833984, 0.03345680236816406, 0.03502511978149414, 0.03659343719482422, 0.0381617546081543, 0.039730072021484375, 0.04129838943481445, 0.04286670684814453, 0.04443502426147461, 0.04600334167480469, 0.047571659088134766, 0.049139976501464844, 0.05070829391479492, 0.052276611328125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 9.0, 8.0, 13.0, 14.0, 20.0, 19.0, 27.0, 35.0, 38.0, 40.0, 53.0, 43.0, 60.0, 77.0, 57.0, 66.0, 65.0, 57.0, 61.0, 44.0, 27.0, 31.0, 26.0, 22.0, 10.0, 18.0, 14.0, 5.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0582275390625, -0.05646848678588867, -0.054709434509277344, -0.052950382232666016, -0.05119132995605469, -0.04943227767944336, -0.04767322540283203, -0.0459141731262207, -0.044155120849609375, -0.04239606857299805, -0.04063701629638672, -0.03887796401977539, -0.03711891174316406, -0.035359859466552734, -0.033600807189941406, -0.03184175491333008, -0.03008270263671875, -0.028323650360107422, -0.026564598083496094, -0.024805545806884766, -0.023046493530273438, -0.02128744125366211, -0.01952838897705078, -0.017769336700439453, -0.016010284423828125, -0.014251232147216797, -0.012492179870605469, -0.01073312759399414, -0.008974075317382812, -0.007215023040771484, -0.005455970764160156, -0.003696918487548828, -0.0019378662109375, -0.00017881393432617188, 0.0015802383422851562, 0.0033392906188964844, 0.0050983428955078125, 0.006857395172119141, 0.008616447448730469, 0.010375499725341797, 0.012134552001953125, 0.013893604278564453, 0.01565265655517578, 0.01741170883178711, 0.019170761108398438, 0.020929813385009766, 0.022688865661621094, 0.024447917938232422, 0.02620697021484375, 0.027966022491455078, 0.029725074768066406, 0.031484127044677734, 0.03324317932128906, 0.03500223159790039, 0.03676128387451172, 0.03852033615112305, 0.040279388427734375, 0.0420384407043457, 0.04379749298095703, 0.04555654525756836, 0.04731559753417969, 0.049074649810791016, 0.050833702087402344, 0.05259275436401367, 0.054351806640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 12.0, 14.0, 25.0, 52.0, 118.0, 291.0, 897.0, 4129.0, 39012.0, 930334.0, 66406.0, 5521.0, 1099.0, 367.0, 147.0, 53.0, 28.0, 16.0, 10.0, 7.0, 6.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.340087890625, -0.3289680480957031, -0.31784820556640625, -0.3067283630371094, -0.2956085205078125, -0.2844886779785156, -0.27336883544921875, -0.2622489929199219, -0.251129150390625, -0.24000930786132812, -0.22888946533203125, -0.21776962280273438, -0.2066497802734375, -0.19552993774414062, -0.18441009521484375, -0.17329025268554688, -0.16217041015625, -0.15105056762695312, -0.13993072509765625, -0.12881088256835938, -0.1176910400390625, -0.10657119750976562, -0.09545135498046875, -0.08433151245117188, -0.073211669921875, -0.062091827392578125, -0.05097198486328125, -0.039852142333984375, -0.0287322998046875, -0.017612457275390625, -0.00649261474609375, 0.004627227783203125, 0.0157470703125, 0.026866912841796875, 0.03798675537109375, 0.049106597900390625, 0.0602264404296875, 0.07134628295898438, 0.08246612548828125, 0.09358596801757812, 0.104705810546875, 0.11582565307617188, 0.12694549560546875, 0.13806533813476562, 0.1491851806640625, 0.16030502319335938, 0.17142486572265625, 0.18254470825195312, 0.19366455078125, 0.20478439331054688, 0.21590423583984375, 0.22702407836914062, 0.2381439208984375, 0.24926376342773438, 0.26038360595703125, 0.2715034484863281, 0.282623291015625, 0.2937431335449219, 0.30486297607421875, 0.3159828186035156, 0.3271026611328125, 0.3382225036621094, 0.34934234619140625, 0.3604621887207031, 0.37158203125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 12.0, 14.0, 21.0, 26.0, 39.0, 51.0, 80.0, 83.0, 113.0, 106.0, 101.0, 81.0, 87.0, 56.0, 36.0, 29.0, 20.0, 20.0, 8.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45751953125, -0.44249725341796875, -0.4274749755859375, -0.41245269775390625, -0.397430419921875, -0.38240814208984375, -0.3673858642578125, -0.35236358642578125, -0.33734130859375, -0.32231903076171875, -0.3072967529296875, -0.29227447509765625, -0.277252197265625, -0.26222991943359375, -0.2472076416015625, -0.23218536376953125, -0.2171630859375, -0.20214080810546875, -0.1871185302734375, -0.17209625244140625, -0.157073974609375, -0.14205169677734375, -0.1270294189453125, -0.11200714111328125, -0.09698486328125, -0.08196258544921875, -0.0669403076171875, -0.05191802978515625, -0.036895751953125, -0.02187347412109375, -0.0068511962890625, 0.00817108154296875, 0.023193359375, 0.03821563720703125, 0.0532379150390625, 0.06826019287109375, 0.083282470703125, 0.09830474853515625, 0.1133270263671875, 0.12834930419921875, 0.14337158203125, 0.15839385986328125, 0.1734161376953125, 0.18843841552734375, 0.203460693359375, 0.21848297119140625, 0.2335052490234375, 0.24852752685546875, 0.2635498046875, 0.27857208251953125, 0.2935943603515625, 0.30861663818359375, 0.323638916015625, 0.33866119384765625, 0.3536834716796875, 0.36870574951171875, 0.38372802734375, 0.39875030517578125, 0.4137725830078125, 0.42879486083984375, 0.443817138671875, 0.45883941650390625, 0.4738616943359375, 0.48888397216796875, 0.50390625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 15.0, 47.0, 285.0, 11011.0, 1036186.0, 856.0, 90.0, 20.0, 8.0, 4.0, 4.0, 0.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3173828125, -1.2776947021484375, -1.238006591796875, -1.1983184814453125, -1.15863037109375, -1.1189422607421875, -1.079254150390625, -1.0395660400390625, -0.9998779296875, -0.9601898193359375, -0.920501708984375, -0.8808135986328125, -0.84112548828125, -0.8014373779296875, -0.761749267578125, -0.7220611572265625, -0.682373046875, -0.6426849365234375, -0.602996826171875, -0.5633087158203125, -0.52362060546875, -0.4839324951171875, -0.444244384765625, -0.4045562744140625, -0.3648681640625, -0.3251800537109375, -0.285491943359375, -0.2458038330078125, -0.20611572265625, -0.1664276123046875, -0.126739501953125, -0.0870513916015625, -0.04736328125, -0.0076751708984375, 0.032012939453125, 0.0717010498046875, 0.11138916015625, 0.1510772705078125, 0.190765380859375, 0.2304534912109375, 0.2701416015625, 0.3098297119140625, 0.349517822265625, 0.3892059326171875, 0.42889404296875, 0.4685821533203125, 0.508270263671875, 0.5479583740234375, 0.587646484375, 0.6273345947265625, 0.667022705078125, 0.7067108154296875, 0.74639892578125, 0.7860870361328125, 0.825775146484375, 0.8654632568359375, 0.9051513671875, 0.9448394775390625, 0.984527587890625, 1.0242156982421875, 1.06390380859375, 1.1035919189453125, 1.143280029296875, 1.1829681396484375, 1.22265625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 1.0, 2.0, 4.0, 9.0, 3.0, 6.0, 4.0, 5.0, 11.0, 9.0, 20.0, 25.0, 26.0, 42.0, 64.0, 97.0, 149.0, 132.0, 95.0, 68.0, 54.0, 26.0, 26.0, 14.0, 16.0, 29.0, 15.0, 11.0, 5.0, 3.0, 3.0, 4.0, 0.0, 4.0, 7.0, 6.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.002187728881836e-05, -5.820672959089279e-05, -5.6391581892967224e-05, -5.4576434195041656e-05, -5.276128649711609e-05, -5.094613879919052e-05, -4.9130991101264954e-05, -4.7315843403339386e-05, -4.550069570541382e-05, -4.368554800748825e-05, -4.187040030956268e-05, -4.0055252611637115e-05, -3.824010491371155e-05, -3.642495721578598e-05, -3.460980951786041e-05, -3.2794661819934845e-05, -3.097951412200928e-05, -2.916436642408371e-05, -2.7349218726158142e-05, -2.5534071028232574e-05, -2.3718923330307007e-05, -2.190377563238144e-05, -2.008862793445587e-05, -1.8273480236530304e-05, -1.6458332538604736e-05, -1.4643184840679169e-05, -1.2828037142753601e-05, -1.1012889444828033e-05, -9.197741746902466e-06, -7.382594048976898e-06, -5.5674463510513306e-06, -3.752298653125763e-06, -1.9371509552001953e-06, -1.2200325727462769e-07, 1.69314444065094e-06, 3.5082921385765076e-06, 5.323439836502075e-06, 7.138587534427643e-06, 8.95373523235321e-06, 1.0768882930278778e-05, 1.2584030628204346e-05, 1.4399178326129913e-05, 1.621432602405548e-05, 1.802947372198105e-05, 1.9844621419906616e-05, 2.1659769117832184e-05, 2.347491681575775e-05, 2.529006451368332e-05, 2.7105212211608887e-05, 2.8920359909534454e-05, 3.073550760746002e-05, 3.255065530538559e-05, 3.436580300331116e-05, 3.6180950701236725e-05, 3.799609839916229e-05, 3.981124609708786e-05, 4.162639379501343e-05, 4.3441541492938995e-05, 4.525668919086456e-05, 4.707183688879013e-05, 4.88869845867157e-05, 5.0702132284641266e-05, 5.2517279982566833e-05, 5.43324276804924e-05, 5.614757537841797e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 7.0, 9.0, 14.0, 22.0, 30.0, 47.0, 70.0, 101.0, 150.0, 284.0, 583.0, 1285.0, 4076.0, 25295.0, 911072.0, 94071.0, 7750.0, 2018.0, 791.0, 350.0, 175.0, 122.0, 81.0, 40.0, 29.0, 19.0, 16.0, 8.0, 14.0, 9.0, 7.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11383056640625, -0.10940265655517578, -0.10497474670410156, -0.10054683685302734, -0.09611892700195312, -0.0916910171508789, -0.08726310729980469, -0.08283519744873047, -0.07840728759765625, -0.07397937774658203, -0.06955146789550781, -0.0651235580444336, -0.060695648193359375, -0.056267738342285156, -0.05183982849121094, -0.04741191864013672, -0.0429840087890625, -0.03855609893798828, -0.03412818908691406, -0.029700279235839844, -0.025272369384765625, -0.020844459533691406, -0.016416549682617188, -0.011988639831542969, -0.00756072998046875, -0.0031328201293945312, 0.0012950897216796875, 0.005722999572753906, 0.010150909423828125, 0.014578819274902344, 0.019006729125976562, 0.02343463897705078, 0.027862548828125, 0.03229045867919922, 0.03671836853027344, 0.041146278381347656, 0.045574188232421875, 0.050002098083496094, 0.05443000793457031, 0.05885791778564453, 0.06328582763671875, 0.06771373748779297, 0.07214164733886719, 0.0765695571899414, 0.08099746704101562, 0.08542537689208984, 0.08985328674316406, 0.09428119659423828, 0.0987091064453125, 0.10313701629638672, 0.10756492614746094, 0.11199283599853516, 0.11642074584960938, 0.1208486557006836, 0.1252765655517578, 0.12970447540283203, 0.13413238525390625, 0.13856029510498047, 0.1429882049560547, 0.1474161148071289, 0.15184402465820312, 0.15627193450927734, 0.16069984436035156, 0.16512775421142578, 0.1695556640625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 7.0, 10.0, 17.0, 26.0, 49.0, 69.0, 131.0, 277.0, 187.0, 95.0, 46.0, 27.0, 23.0, 10.0, 10.0, 10.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.183837890625, -0.176666259765625, -0.16949462890625, -0.162322998046875, -0.1551513671875, -0.147979736328125, -0.14080810546875, -0.133636474609375, -0.12646484375, -0.119293212890625, -0.11212158203125, -0.104949951171875, -0.0977783203125, -0.090606689453125, -0.08343505859375, -0.076263427734375, -0.069091796875, -0.061920166015625, -0.05474853515625, -0.047576904296875, -0.0404052734375, -0.033233642578125, -0.02606201171875, -0.018890380859375, -0.01171875, -0.004547119140625, 0.00262451171875, 0.009796142578125, 0.0169677734375, 0.024139404296875, 0.03131103515625, 0.038482666015625, 0.045654296875, 0.052825927734375, 0.05999755859375, 0.067169189453125, 0.0743408203125, 0.081512451171875, 0.08868408203125, 0.095855712890625, 0.10302734375, 0.110198974609375, 0.11737060546875, 0.124542236328125, 0.1317138671875, 0.138885498046875, 0.14605712890625, 0.153228759765625, 0.160400390625, 0.167572021484375, 0.17474365234375, 0.181915283203125, 0.1890869140625, 0.196258544921875, 0.20343017578125, 0.210601806640625, 0.2177734375, 0.224945068359375, 0.23211669921875, 0.239288330078125, 0.2464599609375, 0.253631591796875, 0.26080322265625, 0.267974853515625, 0.275146484375]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 8.0, 10.0, 17.0, 27.0, 109.0, 367.0, 287.0, 104.0, 39.0, 12.0, 15.0, 5.0, 5.0, 7.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.168622970581055, -6.036830425262451, -5.905038356781006, -5.773245811462402, -5.641453266143799, -5.509660720825195, -5.37786865234375, -5.2460761070251465, -5.114283561706543, -4.9824910163879395, -4.850698947906494, -4.718906402587891, -4.587113857269287, -4.455321311950684, -4.323529243469238, -4.191736698150635, -4.059944152832031, -3.928151845932007, -3.7963593006134033, -3.664566993713379, -3.5327744483947754, -3.400982141494751, -3.2691898345947266, -3.137397289276123, -3.0056052207946777, -2.8738129138946533, -2.74202036857605, -2.6102280616760254, -2.478435516357422, -2.3466432094573975, -2.214850902557373, -2.0830583572387695, -1.951265811920166, -1.819473385810852, -1.687680959701538, -1.5558886528015137, -1.4240961074829102, -1.2923038005828857, -1.1605113744735718, -1.0287189483642578, -0.8969265222549438, -0.7651340961456299, -0.6333416700363159, -0.5015493035316467, -0.36975687742233276, -0.2379644513130188, -0.10617208480834961, 0.025620341300964355, 0.15741276741027832, 0.2892051935195923, 0.42099758982658386, 0.5527899861335754, 0.6845824122428894, 0.8163748383522034, 0.9481672048568726, 1.0799596309661865, 1.2117520570755005, 1.3435444831848145, 1.4753369092941284, 1.6071293354034424, 1.7389216423034668, 1.8707141876220703, 2.0025064945220947, 2.134298801422119, 2.2660913467407227]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 8.0, 20.0, 20.0, 38.0, 75.0, 104.0, 133.0, 182.0, 134.0, 95.0, 77.0, 40.0, 29.0, 10.0, 14.0, 5.0, 8.0, 1.0, 5.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.509722709655762, -4.4109601974487305, -4.312197685241699, -4.213435649871826, -4.114673137664795, -4.015910625457764, -3.9171481132507324, -3.8183858394622803, -3.719623565673828, -3.620861053466797, -3.5220987796783447, -3.4233362674713135, -3.3245739936828613, -3.22581148147583, -3.127048969268799, -3.0282866954803467, -2.9295241832733154, -2.830761671066284, -2.731999397277832, -2.633236885070801, -2.5344746112823486, -2.4357120990753174, -2.3369498252868652, -2.238187313079834, -2.1394248008728027, -2.0406622886657715, -1.9419000148773193, -1.843137502670288, -1.744375228881836, -1.6456127166748047, -1.546850323677063, -1.4480879306793213, -1.3493256568908691, -1.2505632638931274, -1.1518008708953857, -1.0530383586883545, -0.9542760252952576, -0.8555136322975159, -0.7567511796951294, -0.6579887866973877, -0.559226393699646, -0.4604640007019043, -0.3617015779018402, -0.2629391551017761, -0.16417676210403442, -0.06541436910629272, 0.03334808349609375, 0.13211047649383545, 0.23087286949157715, 0.32963526248931885, 0.42839768528938293, 0.527160108089447, 0.6259225010871887, 0.7246848940849304, 0.8234473466873169, 0.9222097396850586, 1.0209721326828003, 1.119734525680542, 1.2184969186782837, 1.3172593116760254, 1.4160218238830566, 1.5147840976715088, 1.61354660987854, 1.7123090028762817, 1.8110713958740234]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 12.0, 19.0, 25.0, 47.0, 87.0, 514.0, 160.0, 50.0, 31.0, 20.0, 14.0, 10.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.39697265625, -0.3882732391357422, -0.3795738220214844, -0.37087440490722656, -0.36217498779296875, -0.35347557067871094, -0.3447761535644531, -0.3360767364501953, -0.3273773193359375, -0.3186779022216797, -0.3099784851074219, -0.30127906799316406, -0.29257965087890625, -0.28388023376464844, -0.2751808166503906, -0.2664813995361328, -0.257781982421875, -0.2490825653076172, -0.24038314819335938, -0.23168373107910156, -0.22298431396484375, -0.21428489685058594, -0.20558547973632812, -0.1968860626220703, -0.1881866455078125, -0.1794872283935547, -0.17078781127929688, -0.16208839416503906, -0.15338897705078125, -0.14468955993652344, -0.13599014282226562, -0.1272907257080078, -0.11859130859375, -0.10989189147949219, -0.10119247436523438, -0.09249305725097656, -0.08379364013671875, -0.07509422302246094, -0.06639480590820312, -0.05769538879394531, -0.0489959716796875, -0.04029655456542969, -0.031597137451171875, -0.022897720336914062, -0.01419830322265625, -0.0054988861083984375, 0.003200531005859375, 0.011899948120117188, 0.020599365234375, 0.029298782348632812, 0.037998199462890625, 0.04669761657714844, 0.05539703369140625, 0.06409645080566406, 0.07279586791992188, 0.08149528503417969, 0.0901947021484375, 0.09889411926269531, 0.10759353637695312, 0.11629295349121094, 0.12499237060546875, 0.13369178771972656, 0.14239120483398438, 0.1510906219482422, 0.1597900390625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 3.0, 5.0, 4.0, 5.0, 7.0, 11.0, 10.0, 10.0, 18.0, 21.0, 25.0, 38.0, 60.0, 70.0, 168.0, 378.0, 1090.0, 6216.0, 8342106.0, 35168.0, 2223.0, 564.0, 195.0, 69.0, 35.0, 27.0, 15.0, 13.0, 8.0, 4.0, 4.0, 5.0, 7.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9338787794113159, -0.9091488122940063, -0.884418785572052, -0.8596888184547424, -0.8349588513374329, -0.8102288246154785, -0.785498857498169, -0.7607688903808594, -0.7360389232635498, -0.7113089561462402, -0.6865789294242859, -0.6618489623069763, -0.6371189951896667, -0.6123889684677124, -0.5876590013504028, -0.5629290342330933, -0.5381990075111389, -0.5134690403938293, -0.4887390434741974, -0.46400904655456543, -0.43927907943725586, -0.4145490825176239, -0.38981908559799194, -0.3650891184806824, -0.3403591215610504, -0.31562912464141846, -0.2908991575241089, -0.26616916060447693, -0.24143917858600616, -0.2167091965675354, -0.19197919964790344, -0.16724921762943268, -0.14251917600631714, -0.11778919398784637, -0.09305920451879501, -0.06832921504974365, -0.04359923303127289, -0.018869251012802124, 0.005860745906829834, 0.030590727925300598, 0.05532070994377136, 0.08005069196224213, 0.10478068143129349, 0.12951067090034485, 0.1542406529188156, 0.17897063493728638, 0.20370063185691833, 0.2284306138753891, 0.25316059589385986, 0.2778905928134918, 0.3026205599308014, 0.32735055685043335, 0.3520805239677429, 0.3768105208873749, 0.40154051780700684, 0.4262704849243164, 0.45100048184394836, 0.4757304787635803, 0.5004604458808899, 0.5251904726028442, 0.5499204397201538, 0.5746504068374634, 0.599380373954773, 0.6241104006767273, 0.6488403677940369]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 1.0, 4.0, 7.0, 4.0, 5.0, 3.0, 8.0, 2.0, 2.0, 5.0, 3.0, 5.0, 3.0, 1.0, 3.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-0.6906124353408813, -0.6626277565956116, -0.6346430778503418, -0.606658399105072, -0.5786737203598022, -0.5506890416145325, -0.5227043628692627, -0.4947196841239929, -0.46673500537872314, -0.43875032663345337, -0.4107656478881836, -0.3827809691429138, -0.35479629039764404, -0.32681161165237427, -0.2988269329071045, -0.2708422541618347, -0.24285760521888733, -0.21487292647361755, -0.18688824772834778, -0.158903568983078, -0.13091889023780823, -0.10293422639369965, -0.07494954764842987, -0.046964868903160095, -0.01898019015789032, 0.009004486724734306, 0.03698916360735893, 0.06497383862733841, 0.09295851737260818, 0.12094318866729736, 0.14892786741256714, 0.17691254615783691, 0.2048972249031067, 0.23288190364837646, 0.26086658239364624, 0.288851261138916, 0.3168359398841858, 0.34482061862945557, 0.37280529737472534, 0.4007899761199951, 0.4287746548652649, 0.45675933361053467, 0.48474401235580444, 0.5127286911010742, 0.540713369846344, 0.5686980485916138, 0.5966827273368835, 0.6246674060821533, 0.6526520252227783, 0.6806367039680481, 0.7086213827133179, 0.7366060614585876, 0.7645907402038574, 0.7925754189491272, 0.820560097694397, 0.8485447764396667, 0.8765294551849365, 0.9045141339302063, 0.9324988126754761, 0.9604834914207458, 0.9884681701660156, 1.0164527893066406, 1.0444375276565552, 1.0724221467971802, 1.1004068851470947]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 3.0, 15.0, 26.0, 43.0, 55.0, 119.0, 143.0, 221.0, 154.0, 93.0, 50.0, 38.0, 18.0, 15.0, 4.0, 6.0, 1.0, 1.0, 3.0], "bins": [-0.1612548828125, -0.15816259384155273, -0.15507030487060547, -0.1519780158996582, -0.14888572692871094, -0.14579343795776367, -0.1427011489868164, -0.13960886001586914, -0.13651657104492188, -0.1334242820739746, -0.13033199310302734, -0.12723970413208008, -0.12414741516113281, -0.12105512619018555, -0.11796283721923828, -0.11487054824829102, -0.11177825927734375, -0.10868597030639648, -0.10559368133544922, -0.10250139236450195, -0.09940910339355469, -0.09631681442260742, -0.09322452545166016, -0.09013223648071289, -0.08703994750976562, -0.08394765853881836, -0.0808553695678711, -0.07776308059692383, -0.07467079162597656, -0.0715785026550293, -0.06848621368408203, -0.06539392471313477, -0.0623016357421875, -0.059209346771240234, -0.05611705780029297, -0.0530247688293457, -0.04993247985839844, -0.04684019088745117, -0.043747901916503906, -0.04065561294555664, -0.037563323974609375, -0.03447103500366211, -0.031378746032714844, -0.028286457061767578, -0.025194168090820312, -0.022101879119873047, -0.01900959014892578, -0.015917301177978516, -0.01282501220703125, -0.009732723236083984, -0.006640434265136719, -0.003548145294189453, -0.0004558563232421875, 0.002636432647705078, 0.005728721618652344, 0.00882101058959961, 0.011913299560546875, 0.01500558853149414, 0.018097877502441406, 0.021190166473388672, 0.024282455444335938, 0.027374744415283203, 0.03046703338623047, 0.033559322357177734, 0.036651611328125]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 1.0, 3.0, 5.0, 7.0, 16.0, 21.0, 14.0, 26.0, 34.0, 53.0, 80.0, 127.0, 175.0, 297.0, 509.0, 974.0, 2094.0, 5245.0, 15983.0, 69484.0, 304697.0, 94006.0, 20029.0, 5958.0, 2261.0, 955.0, 486.0, 250.0, 159.0, 102.0, 70.0, 44.0, 25.0, 26.0, 14.0, 16.0, 7.0, 10.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.037109375, -1.0115585327148438, -0.9860076904296875, -0.9604568481445312, -0.934906005859375, -0.9093551635742188, -0.8838043212890625, -0.8582534790039062, -0.83270263671875, -0.8071517944335938, -0.7816009521484375, -0.7560501098632812, -0.730499267578125, -0.7049484252929688, -0.6793975830078125, -0.6538467407226562, -0.6282958984375, -0.6027450561523438, -0.5771942138671875, -0.5516433715820312, -0.526092529296875, -0.5005416870117188, -0.4749908447265625, -0.44944000244140625, -0.42388916015625, -0.39833831787109375, -0.3727874755859375, -0.34723663330078125, -0.321685791015625, -0.29613494873046875, -0.2705841064453125, -0.24503326416015625, -0.219482421875, -0.19393157958984375, -0.1683807373046875, -0.14282989501953125, -0.117279052734375, -0.09172821044921875, -0.0661773681640625, -0.04062652587890625, -0.01507568359375, 0.01047515869140625, 0.0360260009765625, 0.06157684326171875, 0.087127685546875, 0.11267852783203125, 0.1382293701171875, 0.16378021240234375, 0.1893310546875, 0.21488189697265625, 0.2404327392578125, 0.26598358154296875, 0.291534423828125, 0.31708526611328125, 0.3426361083984375, 0.36818695068359375, 0.39373779296875, 0.41928863525390625, 0.4448394775390625, 0.47039031982421875, 0.495941162109375, 0.5214920043945312, 0.5470428466796875, 0.5725936889648438, 0.59814453125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 1.0, 14.0, 9.0, 18.0, 24.0, 41.0, 49.0, 77.0, 110.0, 131.0, 134.0, 133.0, 72.0, 51.0, 41.0, 25.0, 14.0, 20.0, 2.0, 5.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.251953125, -0.24603843688964844, -0.24012374877929688, -0.2342090606689453, -0.22829437255859375, -0.2223796844482422, -0.21646499633789062, -0.21055030822753906, -0.2046356201171875, -0.19872093200683594, -0.19280624389648438, -0.1868915557861328, -0.18097686767578125, -0.1750621795654297, -0.16914749145507812, -0.16323280334472656, -0.157318115234375, -0.15140342712402344, -0.14548873901367188, -0.1395740509033203, -0.13365936279296875, -0.1277446746826172, -0.12182998657226562, -0.11591529846191406, -0.1100006103515625, -0.10408592224121094, -0.09817123413085938, -0.09225654602050781, -0.08634185791015625, -0.08042716979980469, -0.07451248168945312, -0.06859779357910156, -0.06268310546875, -0.05676841735839844, -0.050853729248046875, -0.04493904113769531, -0.03902435302734375, -0.03310966491699219, -0.027194976806640625, -0.021280288696289062, -0.0153656005859375, -0.009450912475585938, -0.003536224365234375, 0.0023784637451171875, 0.00829315185546875, 0.014207839965820312, 0.020122528076171875, 0.026037216186523438, 0.031951904296875, 0.03786659240722656, 0.043781280517578125, 0.04969596862792969, 0.05561065673828125, 0.06152534484863281, 0.06744003295898438, 0.07335472106933594, 0.0792694091796875, 0.08518409729003906, 0.09109878540039062, 0.09701347351074219, 0.10292816162109375, 0.10884284973144531, 0.11475753784179688, 0.12067222595214844, 0.1265869140625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 2.0, 5.0, 9.0, 6.0, 4.0, 10.0, 19.0, 14.0, 24.0, 30.0, 37.0, 42.0, 34.0, 39.0, 38.0, 38.0, 22.0, 20.0, 21.0, 16.0, 12.0, 11.0, 12.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.4283409118652344, -0.4173845648765564, -0.4064282178878784, -0.39547187089920044, -0.38451555371284485, -0.37355920672416687, -0.3626028597354889, -0.3516465127468109, -0.3406901955604553, -0.32973384857177734, -0.31877750158309937, -0.3078211545944214, -0.2968648374080658, -0.2859084904193878, -0.27495214343070984, -0.26399579644203186, -0.2530394494533539, -0.2420831024646759, -0.23112677037715912, -0.22017042338848114, -0.20921409130096436, -0.19825774431228638, -0.1873013973236084, -0.17634505033493042, -0.16538871824741364, -0.15443237125873566, -0.14347603917121887, -0.1325196921825409, -0.12156335264444351, -0.11060701310634613, -0.09965066611766815, -0.08869432657957077, -0.077737957239151, -0.06678161770105362, -0.05582527443766594, -0.04486893117427826, -0.03391259163618088, -0.022956252098083496, -0.011999905109405518, -0.001043565571308136, 0.009912773966789246, 0.020869115367531776, 0.03182545676827431, 0.04278180003166199, 0.05373813956975937, 0.06469447910785675, 0.07565082609653473, 0.08660716563463211, 0.09756350517272949, 0.10851984471082687, 0.11947618424892426, 0.13043253123760223, 0.14138886332511902, 0.152345210313797, 0.16330155730247498, 0.17425790429115295, 0.18521423637866974, 0.19617058336734772, 0.2071269154548645, 0.21808326244354248, 0.22903960943222046, 0.23999594151973724, 0.2509523034095764, 0.261908620595932, 0.27286496758461]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 3.0, 3.0, 10.0, 8.0, 20.0, 12.0, 12.0, 18.0, 14.0, 23.0, 41.0, 37.0, 37.0, 39.0, 25.0, 31.0, 21.0, 27.0, 9.0, 21.0, 13.0, 13.0, 8.0, 12.0, 7.0, 5.0, 3.0, 5.0, 5.0, 5.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7345180511474609, -0.7138820290565491, -0.693246066570282, -0.6726100444793701, -0.651974081993103, -0.6313380599021912, -0.6107020378112793, -0.5900660753250122, -0.5694300532341003, -0.5487940311431885, -0.5281580686569214, -0.5075220465660095, -0.48688605427742004, -0.46625006198883057, -0.4456140398979187, -0.4249780476093292, -0.40434205532073975, -0.38370606303215027, -0.3630700707435608, -0.3424340486526489, -0.32179805636405945, -0.30116206407546997, -0.2805260419845581, -0.25989004969596863, -0.23925405740737915, -0.21861806511878967, -0.197982057929039, -0.17734605073928833, -0.15671005845069885, -0.13607406616210938, -0.1154380589723587, -0.09480205178260803, -0.07416605949401855, -0.05353005975484848, -0.032894060015678406, -0.012258060276508331, 0.008377939462661743, 0.029013939201831818, 0.04964993894100189, 0.07028594613075256, 0.09092193841934204, 0.11155793815851212, 0.1321939378976822, 0.15282994508743286, 0.17346593737602234, 0.19410192966461182, 0.2147379368543625, 0.23537394404411316, 0.25600993633270264, 0.2766459286212921, 0.2972819209098816, 0.31791794300079346, 0.33855393528938293, 0.3591899275779724, 0.3798259496688843, 0.40046194195747375, 0.42109793424606323, 0.4417339265346527, 0.4623699188232422, 0.48300594091415405, 0.5036419630050659, 0.524277925491333, 0.5449139475822449, 0.5655499696731567, 0.5861859321594238]}, "eval/loss": 4.281228065490723, "eval/bleu": 0.0, "eval/runtime": 2569.7097, "eval/samples_per_second": 5.744, "eval/steps_per_second": 0.718} \ No newline at end of file