diff --git "a/wandb/run-20220326_171130-bdf5nvyg/files/wandb-summary.json" "b/wandb/run-20220326_171130-bdf5nvyg/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220326_171130-bdf5nvyg/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.4437, "train/learning_rate": 0.0002988, "train/epoch": 2.24, "train/global_step": 500, "_runtime": 11409, "_timestamp": 1648326099, "_step": 500, "gradients/decoder.model.decoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 19.0, 57.0, 115.0, 203.0, 231.0, 176.0, 113.0, 47.0, 20.0, 13.0, 9.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.956857681274414, -27.012638092041016, -26.068418502807617, -25.12419891357422, -24.17997932434082, -23.235759735107422, -22.291542053222656, -21.347320556640625, -20.40310287475586, -19.45888328552246, -18.514663696289062, -17.570444107055664, -16.626224517822266, -15.682004928588867, -14.737786293029785, -13.793566703796387, -12.849346160888672, -11.905126571655273, -10.960906982421875, -10.016687393188477, -9.072467803955078, -8.12824821472168, -7.184029579162598, -6.239809989929199, -5.295590400695801, -4.351370811462402, -3.407151460647583, -2.4629321098327637, -1.5187125205993652, -0.5744929313659668, 0.36972618103027344, 1.3139457702636719, 2.258167266845703, 3.2023868560791016, 4.1466064453125, 5.09082555770874, 6.035045146942139, 6.979264736175537, 7.923483848571777, 8.867703437805176, 9.811923027038574, 10.756142616271973, 11.700362205505371, 12.644580841064453, 13.588800430297852, 14.53302001953125, 15.477239608764648, 16.421459197998047, 17.365678787231445, 18.309898376464844, 19.254117965698242, 20.19833755493164, 21.14255714416504, 22.086776733398438, 23.030994415283203, 23.975215911865234, 24.91943359375, 25.8636531829834, 26.807872772216797, 27.752092361450195, 28.696311950683594, 29.640531539916992, 30.58475112915039, 31.528968811035156, 32.47319030761719]}, "gradients/decoder.model.decoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 2.0, 2.0, 6.0, 5.0, 10.0, 12.0, 16.0, 17.0, 28.0, 21.0, 25.0, 43.0, 54.0, 38.0, 40.0, 59.0, 53.0, 61.0, 54.0, 58.0, 58.0, 52.0, 49.0, 47.0, 42.0, 32.0, 22.0, 27.0, 16.0, 15.0, 11.0, 9.0, 6.0, 5.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-26.317832946777344, -25.64121437072754, -24.964595794677734, -24.287975311279297, -23.611356735229492, -22.934738159179688, -22.258119583129883, -21.581501007080078, -20.90488052368164, -20.228261947631836, -19.55164337158203, -18.875022888183594, -18.19840431213379, -17.521785736083984, -16.84516716003418, -16.168548583984375, -15.49193000793457, -14.815311431884766, -14.138691902160645, -13.46207332611084, -12.785453796386719, -12.108835220336914, -11.43221664428711, -10.755598068237305, -10.078978538513184, -9.402359962463379, -8.725740432739258, -8.049121856689453, -7.37250280380249, -6.695883750915527, -6.019265174865723, -5.34264612197876, -4.666025161743164, -3.989406108856201, -3.3127872943878174, -2.6361684799194336, -1.9595494270324707, -1.2829303741455078, -0.6063117980957031, 0.07030725479125977, 0.7469263076782227, 1.423545241355896, 2.1001641750335693, 2.776782989501953, 3.453402042388916, 4.130021095275879, 4.806639671325684, 5.4832587242126465, 6.159877777099609, 6.836496829986572, 7.513115882873535, 8.18973445892334, 8.866353988647461, 9.542972564697266, 10.21959114074707, 10.896209716796875, 11.572829246520996, 12.2494478225708, 12.926067352294922, 13.602685928344727, 14.279304504394531, 14.955924034118652, 15.632542610168457, 16.309162139892578, 16.985780715942383]}, "gradients/decoder.model.decoder.layers.11.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 7.0, 9.0, 19.0, 25.0, 37.0, 67.0, 100.0, 155.0, 278.0, 462.0, 825.0, 1725.0, 3613.0, 8335.0, 21661.0, 62900.0, 189093.0, 571053.0, 1453226.0, 1192073.0, 446588.0, 151848.0, 53528.0, 20920.0, 8803.0, 3763.0, 1600.0, 750.0, 354.0, 202.0, 105.0, 60.0, 50.0, 18.0, 8.0, 10.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.25, -21.630126953125, -21.01025390625, -20.390380859375, -19.7705078125, -19.150634765625, -18.53076171875, -17.910888671875, -17.291015625, -16.671142578125, -16.05126953125, -15.431396484375, -14.8115234375, -14.191650390625, -13.57177734375, -12.951904296875, -12.33203125, -11.712158203125, -11.09228515625, -10.472412109375, -9.8525390625, -9.232666015625, -8.61279296875, -7.992919921875, -7.373046875, -6.753173828125, -6.13330078125, -5.513427734375, -4.8935546875, -4.273681640625, -3.65380859375, -3.033935546875, -2.4140625, -1.794189453125, -1.17431640625, -0.554443359375, 0.0654296875, 0.685302734375, 1.30517578125, 1.925048828125, 2.544921875, 3.164794921875, 3.78466796875, 4.404541015625, 5.0244140625, 5.644287109375, 6.26416015625, 6.884033203125, 7.50390625, 8.123779296875, 8.74365234375, 9.363525390625, 9.9833984375, 10.603271484375, 11.22314453125, 11.843017578125, 12.462890625, 13.082763671875, 13.70263671875, 14.322509765625, 14.9423828125, 15.562255859375, 16.18212890625, 16.802001953125, 17.421875]}, "gradients/decoder.model.decoder.layers.11.fc2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 5.0, 3.0, 3.0, 6.0, 6.0, 6.0, 10.0, 8.0, 15.0, 20.0, 21.0, 31.0, 30.0, 34.0, 37.0, 45.0, 44.0, 50.0, 47.0, 50.0, 54.0, 53.0, 63.0, 60.0, 49.0, 43.0, 42.0, 38.0, 25.0, 27.0, 16.0, 13.0, 14.0, 11.0, 8.0, 2.0, 5.0, 6.0, 6.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0], "bins": [-33.28125, -32.43359375, -31.5859375, -30.73828125, -29.890625, -29.04296875, -28.1953125, -27.34765625, -26.5, -25.65234375, -24.8046875, -23.95703125, -23.109375, -22.26171875, -21.4140625, -20.56640625, -19.71875, -18.87109375, -18.0234375, -17.17578125, -16.328125, -15.48046875, -14.6328125, -13.78515625, -12.9375, -12.08984375, -11.2421875, -10.39453125, -9.546875, -8.69921875, -7.8515625, -7.00390625, -6.15625, -5.30859375, -4.4609375, -3.61328125, -2.765625, -1.91796875, -1.0703125, -0.22265625, 0.625, 1.47265625, 2.3203125, 3.16796875, 4.015625, 4.86328125, 5.7109375, 6.55859375, 7.40625, 8.25390625, 9.1015625, 9.94921875, 10.796875, 11.64453125, 12.4921875, 13.33984375, 14.1875, 15.03515625, 15.8828125, 16.73046875, 17.578125, 18.42578125, 19.2734375, 20.12109375, 20.96875]}, "gradients/decoder.model.decoder.layers.11.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 11.0, 26.0, 91.0, 557.0, 4192412.0, 996.0, 129.0, 33.0, 16.0, 6.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1524.0, -1486.4765625, -1448.953125, -1411.4296875, -1373.90625, -1336.3828125, -1298.859375, -1261.3359375, -1223.8125, -1186.2890625, -1148.765625, -1111.2421875, -1073.71875, -1036.1953125, -998.671875, -961.1484375, -923.625, -886.1015625, -848.578125, -811.0546875, -773.53125, -736.0078125, -698.484375, -660.9609375, -623.4375, -585.9140625, -548.390625, -510.8671875, -473.34375, -435.8203125, -398.296875, -360.7734375, -323.25, -285.7265625, -248.203125, -210.6796875, -173.15625, -135.6328125, -98.109375, -60.5859375, -23.0625, 14.4609375, 51.984375, 89.5078125, 127.03125, 164.5546875, 202.078125, 239.6015625, 277.125, 314.6484375, 352.171875, 389.6953125, 427.21875, 464.7421875, 502.265625, 539.7890625, 577.3125, 614.8359375, 652.359375, 689.8828125, 727.40625, 764.9296875, 802.453125, 839.9765625, 877.5]}, "gradients/decoder.model.decoder.layers.11.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 11.0, 23.0, 48.0, 179.0, 751.0, 2264.0, 572.0, 141.0, 51.0, 14.0, 13.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.28125, -37.169921875, -36.05859375, -34.947265625, -33.8359375, -32.724609375, -31.61328125, -30.501953125, -29.390625, -28.279296875, -27.16796875, -26.056640625, -24.9453125, -23.833984375, -22.72265625, -21.611328125, -20.5, -19.388671875, -18.27734375, -17.166015625, -16.0546875, -14.943359375, -13.83203125, -12.720703125, -11.609375, -10.498046875, -9.38671875, -8.275390625, -7.1640625, -6.052734375, -4.94140625, -3.830078125, -2.71875, -1.607421875, -0.49609375, 0.615234375, 1.7265625, 2.837890625, 3.94921875, 5.060546875, 6.171875, 7.283203125, 8.39453125, 9.505859375, 10.6171875, 11.728515625, 12.83984375, 13.951171875, 15.0625, 16.173828125, 17.28515625, 18.396484375, 19.5078125, 20.619140625, 21.73046875, 22.841796875, 23.953125, 25.064453125, 26.17578125, 27.287109375, 28.3984375, 29.509765625, 30.62109375, 31.732421875, 32.84375]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 105.0, 577.0, 292.0, 31.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-214.02769470214844, -207.03399658203125, -200.04029846191406, -193.04660034179688, -186.05288696289062, -179.05918884277344, -172.06549072265625, -165.07179260253906, -158.07809448242188, -151.0843963623047, -144.0906982421875, -137.09698486328125, -130.10328674316406, -123.10958862304688, -116.11589050292969, -109.1221923828125, -102.12847900390625, -95.13478088378906, -88.14107513427734, -81.14737701416016, -74.15367126464844, -67.15997314453125, -60.16627502441406, -53.17257308959961, -46.178871154785156, -39.1851692199707, -32.19146728515625, -25.197769165039062, -18.20406723022461, -11.210365295410156, -4.216667175292969, 2.7770347595214844, 9.770721435546875, 16.764423370361328, 23.75812339782715, 30.75182342529297, 37.74552536010742, 44.739227294921875, 51.73292541503906, 58.726627349853516, 65.72032928466797, 72.71402740478516, 79.70773315429688, 86.70143127441406, 93.69512939453125, 100.68883514404297, 107.68253326416016, 114.67623901367188, 121.66993713378906, 128.66363525390625, 135.65733337402344, 142.65103149414062, 149.64474487304688, 156.63844299316406, 163.63214111328125, 170.62583923339844, 177.61953735351562, 184.6132354736328, 191.60693359375, 198.60064697265625, 205.59434509277344, 212.58804321289062, 219.5817413330078, 226.575439453125, 233.56915283203125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 7.0, 9.0, 15.0, 21.0, 24.0, 46.0, 73.0, 75.0, 73.0, 91.0, 93.0, 108.0, 86.0, 75.0, 78.0, 48.0, 42.0, 20.0, 11.0, 12.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.15765380859375, -51.66022491455078, -50.16279983520508, -48.66537094116211, -47.167945861816406, -45.67051696777344, -44.173091888427734, -42.675662994384766, -41.17823791503906, -39.680809020996094, -38.18338394165039, -36.68595504760742, -35.18852996826172, -33.69110107421875, -32.19367599487305, -30.696247100830078, -29.198820114135742, -27.701393127441406, -26.20396614074707, -24.706539154052734, -23.2091121673584, -21.711685180664062, -20.214256286621094, -18.71683120727539, -17.219402313232422, -15.721975326538086, -14.22454833984375, -12.727121353149414, -11.229694366455078, -9.732267379760742, -8.23483943939209, -6.737412452697754, -5.239986419677734, -3.7425594329833984, -2.2451322078704834, -0.7477049827575684, 0.7497220039367676, 2.2471489906311035, 3.7445764541625977, 5.242003440856934, 6.7394304275512695, 8.236857414245605, 9.734284400939941, 11.231712341308594, 12.72913932800293, 14.226566314697266, 15.723993301391602, 17.221420288085938, 18.718847274780273, 20.21627426147461, 21.713701248168945, 23.21112823486328, 24.708555221557617, 26.205982208251953, 27.703411102294922, 29.200836181640625, 30.698265075683594, 32.19569396972656, 33.693119049072266, 35.190547943115234, 36.68797302246094, 38.185401916503906, 39.68282699584961, 41.18025588989258, 42.67768096923828]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 0.0, 3.0, 3.0, 5.0, 9.0, 5.0, 10.0, 15.0, 23.0, 30.0, 51.0, 85.0, 171.0, 332.0, 911.0, 3192.0, 17255.0, 144752.0, 632343.0, 217904.0, 25197.0, 4271.0, 1124.0, 418.0, 180.0, 91.0, 60.0, 39.0, 21.0, 22.0, 11.0, 9.0, 6.0, 3.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.25, -10.8565673828125, -10.463134765625, -10.0697021484375, -9.67626953125, -9.2828369140625, -8.889404296875, -8.4959716796875, -8.1025390625, -7.7091064453125, -7.315673828125, -6.9222412109375, -6.52880859375, -6.1353759765625, -5.741943359375, -5.3485107421875, -4.955078125, -4.5616455078125, -4.168212890625, -3.7747802734375, -3.38134765625, -2.9879150390625, -2.594482421875, -2.2010498046875, -1.8076171875, -1.4141845703125, -1.020751953125, -0.6273193359375, -0.23388671875, 0.1595458984375, 0.552978515625, 0.9464111328125, 1.33984375, 1.7332763671875, 2.126708984375, 2.5201416015625, 2.91357421875, 3.3070068359375, 3.700439453125, 4.0938720703125, 4.4873046875, 4.8807373046875, 5.274169921875, 5.6676025390625, 6.06103515625, 6.4544677734375, 6.847900390625, 7.2413330078125, 7.634765625, 8.0281982421875, 8.421630859375, 8.8150634765625, 9.20849609375, 9.6019287109375, 9.995361328125, 10.3887939453125, 10.7822265625, 11.1756591796875, 11.569091796875, 11.9625244140625, 12.35595703125, 12.7493896484375, 13.142822265625, 13.5362548828125, 13.9296875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 11.0, 19.0, 29.0, 51.0, 97.0, 80.0, 116.0, 126.0, 144.0, 106.0, 91.0, 70.0, 35.0, 15.0, 8.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.65625, -60.099609375, -58.54296875, -56.986328125, -55.4296875, -53.873046875, -52.31640625, -50.759765625, -49.203125, -47.646484375, -46.08984375, -44.533203125, -42.9765625, -41.419921875, -39.86328125, -38.306640625, -36.75, -35.193359375, -33.63671875, -32.080078125, -30.5234375, -28.966796875, -27.41015625, -25.853515625, -24.296875, -22.740234375, -21.18359375, -19.626953125, -18.0703125, -16.513671875, -14.95703125, -13.400390625, -11.84375, -10.287109375, -8.73046875, -7.173828125, -5.6171875, -4.060546875, -2.50390625, -0.947265625, 0.609375, 2.166015625, 3.72265625, 5.279296875, 6.8359375, 8.392578125, 9.94921875, 11.505859375, 13.0625, 14.619140625, 16.17578125, 17.732421875, 19.2890625, 20.845703125, 22.40234375, 23.958984375, 25.515625, 27.072265625, 28.62890625, 30.185546875, 31.7421875, 33.298828125, 34.85546875, 36.412109375, 37.96875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 8.0, 10.0, 17.0, 37.0, 64.0, 116.0, 189.0, 301.0, 582.0, 1106.0, 2134.0, 4266.0, 8694.0, 18745.0, 42104.0, 98667.0, 208469.0, 289703.0, 203048.0, 94435.0, 40450.0, 18210.0, 8429.0, 4157.0, 2119.0, 1111.0, 586.0, 344.0, 180.0, 111.0, 57.0, 33.0, 22.0, 24.0, 14.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0], "bins": [-4.078125, -3.966339111328125, -3.85455322265625, -3.742767333984375, -3.6309814453125, -3.519195556640625, -3.40740966796875, -3.295623779296875, -3.183837890625, -3.072052001953125, -2.96026611328125, -2.848480224609375, -2.7366943359375, -2.624908447265625, -2.51312255859375, -2.401336669921875, -2.28955078125, -2.177764892578125, -2.06597900390625, -1.954193115234375, -1.8424072265625, -1.730621337890625, -1.61883544921875, -1.507049560546875, -1.395263671875, -1.283477783203125, -1.17169189453125, -1.059906005859375, -0.9481201171875, -0.836334228515625, -0.72454833984375, -0.612762451171875, -0.5009765625, -0.389190673828125, -0.27740478515625, -0.165618896484375, -0.0538330078125, 0.057952880859375, 0.16973876953125, 0.281524658203125, 0.393310546875, 0.505096435546875, 0.61688232421875, 0.728668212890625, 0.8404541015625, 0.952239990234375, 1.06402587890625, 1.175811767578125, 1.28759765625, 1.399383544921875, 1.51116943359375, 1.622955322265625, 1.7347412109375, 1.846527099609375, 1.95831298828125, 2.070098876953125, 2.181884765625, 2.293670654296875, 2.40545654296875, 2.517242431640625, 2.6290283203125, 2.740814208984375, 2.85260009765625, 2.964385986328125, 3.076171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 2.0, 7.0, 7.0, 5.0, 12.0, 9.0, 23.0, 20.0, 27.0, 35.0, 30.0, 33.0, 46.0, 65.0, 49.0, 59.0, 47.0, 58.0, 47.0, 41.0, 59.0, 39.0, 43.0, 47.0, 25.0, 29.0, 15.0, 22.0, 26.0, 14.0, 18.0, 12.0, 7.0, 3.0, 4.0, 6.0, 6.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-48.75, -47.39404296875, -46.0380859375, -44.68212890625, -43.326171875, -41.97021484375, -40.6142578125, -39.25830078125, -37.90234375, -36.54638671875, -35.1904296875, -33.83447265625, -32.478515625, -31.12255859375, -29.7666015625, -28.41064453125, -27.0546875, -25.69873046875, -24.3427734375, -22.98681640625, -21.630859375, -20.27490234375, -18.9189453125, -17.56298828125, -16.20703125, -14.85107421875, -13.4951171875, -12.13916015625, -10.783203125, -9.42724609375, -8.0712890625, -6.71533203125, -5.359375, -4.00341796875, -2.6474609375, -1.29150390625, 0.064453125, 1.42041015625, 2.7763671875, 4.13232421875, 5.48828125, 6.84423828125, 8.2001953125, 9.55615234375, 10.912109375, 12.26806640625, 13.6240234375, 14.97998046875, 16.3359375, 17.69189453125, 19.0478515625, 20.40380859375, 21.759765625, 23.11572265625, 24.4716796875, 25.82763671875, 27.18359375, 28.53955078125, 29.8955078125, 31.25146484375, 32.607421875, 33.96337890625, 35.3193359375, 36.67529296875, 38.03125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 0.0, 5.0, 8.0, 8.0, 17.0, 11.0, 32.0, 36.0, 66.0, 113.0, 180.0, 259.0, 479.0, 888.0, 1622.0, 3372.0, 7489.0, 19399.0, 64489.0, 305636.0, 475923.0, 118173.0, 29892.0, 10828.0, 4612.0, 2288.0, 1093.0, 675.0, 360.0, 242.0, 125.0, 74.0, 51.0, 32.0, 27.0, 16.0, 12.0, 10.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7646484375, -0.73846435546875, -0.7122802734375, -0.68609619140625, -0.659912109375, -0.63372802734375, -0.6075439453125, -0.58135986328125, -0.55517578125, -0.52899169921875, -0.5028076171875, -0.47662353515625, -0.450439453125, -0.42425537109375, -0.3980712890625, -0.37188720703125, -0.345703125, -0.31951904296875, -0.2933349609375, -0.26715087890625, -0.240966796875, -0.21478271484375, -0.1885986328125, -0.16241455078125, -0.13623046875, -0.11004638671875, -0.0838623046875, -0.05767822265625, -0.031494140625, -0.00531005859375, 0.0208740234375, 0.04705810546875, 0.0732421875, 0.09942626953125, 0.1256103515625, 0.15179443359375, 0.177978515625, 0.20416259765625, 0.2303466796875, 0.25653076171875, 0.28271484375, 0.30889892578125, 0.3350830078125, 0.36126708984375, 0.387451171875, 0.41363525390625, 0.4398193359375, 0.46600341796875, 0.4921875, 0.51837158203125, 0.5445556640625, 0.57073974609375, 0.596923828125, 0.62310791015625, 0.6492919921875, 0.67547607421875, 0.70166015625, 0.72784423828125, 0.7540283203125, 0.78021240234375, 0.806396484375, 0.83258056640625, 0.8587646484375, 0.88494873046875, 0.9111328125]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 5.0, 5.0, 4.0, 7.0, 15.0, 7.0, 20.0, 18.0, 33.0, 36.0, 40.0, 60.0, 68.0, 82.0, 91.0, 85.0, 84.0, 67.0, 68.0, 43.0, 35.0, 37.0, 29.0, 9.0, 17.0, 10.0, 6.0, 5.0, 6.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000507354736328125, -0.0004939921200275421, -0.00048062950372695923, -0.00046726688742637634, -0.00045390427112579346, -0.00044054165482521057, -0.0004271790385246277, -0.0004138164222240448, -0.0004004538059234619, -0.00038709118962287903, -0.00037372857332229614, -0.00036036595702171326, -0.00034700334072113037, -0.0003336407244205475, -0.0003202781081199646, -0.0003069154918193817, -0.00029355287551879883, -0.00028019025921821594, -0.00026682764291763306, -0.00025346502661705017, -0.00024010241031646729, -0.0002267397940158844, -0.00021337717771530151, -0.00020001456141471863, -0.00018665194511413574, -0.00017328932881355286, -0.00015992671251296997, -0.00014656409621238708, -0.0001332014799118042, -0.00011983886361122131, -0.00010647624731063843, -9.311363101005554e-05, -7.975101470947266e-05, -6.638839840888977e-05, -5.3025782108306885e-05, -3.9663165807724e-05, -2.6300549507141113e-05, -1.2937933206558228e-05, 4.246830940246582e-07, 1.3787299394607544e-05, 2.714991569519043e-05, 4.0512531995773315e-05, 5.38751482963562e-05, 6.723776459693909e-05, 8.060038089752197e-05, 9.396299719810486e-05, 0.00010732561349868774, 0.00012068822979927063, 0.00013405084609985352, 0.0001474134624004364, 0.0001607760787010193, 0.00017413869500160217, 0.00018750131130218506, 0.00020086392760276794, 0.00021422654390335083, 0.00022758916020393372, 0.0002409517765045166, 0.0002543143928050995, 0.0002676770091056824, 0.00028103962540626526, 0.00029440224170684814, 0.00030776485800743103, 0.0003211274743080139, 0.0003344900906085968, 0.0003478527069091797]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 4.0, 10.0, 8.0, 8.0, 12.0, 11.0, 23.0, 23.0, 42.0, 64.0, 114.0, 278.0, 1913.0, 35014.0, 982262.0, 26606.0, 1566.0, 291.0, 104.0, 50.0, 44.0, 20.0, 17.0, 6.0, 7.0, 7.0, 5.0, 13.0, 8.0, 3.0, 1.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.12109375, -3.9901123046875, -3.859130859375, -3.7281494140625, -3.59716796875, -3.4661865234375, -3.335205078125, -3.2042236328125, -3.0732421875, -2.9422607421875, -2.811279296875, -2.6802978515625, -2.54931640625, -2.4183349609375, -2.287353515625, -2.1563720703125, -2.025390625, -1.8944091796875, -1.763427734375, -1.6324462890625, -1.50146484375, -1.3704833984375, -1.239501953125, -1.1085205078125, -0.9775390625, -0.8465576171875, -0.715576171875, -0.5845947265625, -0.45361328125, -0.3226318359375, -0.191650390625, -0.0606689453125, 0.0703125, 0.2012939453125, 0.332275390625, 0.4632568359375, 0.59423828125, 0.7252197265625, 0.856201171875, 0.9871826171875, 1.1181640625, 1.2491455078125, 1.380126953125, 1.5111083984375, 1.64208984375, 1.7730712890625, 1.904052734375, 2.0350341796875, 2.166015625, 2.2969970703125, 2.427978515625, 2.5589599609375, 2.68994140625, 2.8209228515625, 2.951904296875, 3.0828857421875, 3.2138671875, 3.3448486328125, 3.475830078125, 3.6068115234375, 3.73779296875, 3.8687744140625, 3.999755859375, 4.1307373046875, 4.26171875]}, "gradients/decoder.model.decoder.layers.11.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 5.0, 8.0, 7.0, 7.0, 12.0, 11.0, 16.0, 22.0, 26.0, 25.0, 44.0, 53.0, 89.0, 100.0, 112.0, 115.0, 89.0, 62.0, 41.0, 30.0, 31.0, 25.0, 11.0, 9.0, 4.0, 9.0, 7.0, 6.0, 6.0, 10.0, 0.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.434326171875, -0.4206390380859375, -0.406951904296875, -0.3932647705078125, -0.37957763671875, -0.3658905029296875, -0.352203369140625, -0.3385162353515625, -0.3248291015625, -0.3111419677734375, -0.297454833984375, -0.2837677001953125, -0.27008056640625, -0.2563934326171875, -0.242706298828125, -0.2290191650390625, -0.21533203125, -0.2016448974609375, -0.187957763671875, -0.1742706298828125, -0.16058349609375, -0.1468963623046875, -0.133209228515625, -0.1195220947265625, -0.1058349609375, -0.0921478271484375, -0.078460693359375, -0.0647735595703125, -0.05108642578125, -0.0373992919921875, -0.023712158203125, -0.0100250244140625, 0.003662109375, 0.0173492431640625, 0.031036376953125, 0.0447235107421875, 0.05841064453125, 0.0720977783203125, 0.085784912109375, 0.0994720458984375, 0.1131591796875, 0.1268463134765625, 0.140533447265625, 0.1542205810546875, 0.16790771484375, 0.1815948486328125, 0.195281982421875, 0.2089691162109375, 0.22265625, 0.2363433837890625, 0.250030517578125, 0.2637176513671875, 0.27740478515625, 0.2910919189453125, 0.304779052734375, 0.3184661865234375, 0.3321533203125, 0.3458404541015625, 0.359527587890625, 0.3732147216796875, 0.38690185546875, 0.4005889892578125, 0.414276123046875, 0.4279632568359375, 0.441650390625]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 110.0, 849.0, 52.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-480.8503723144531, -471.10443115234375, -461.3584899902344, -451.612548828125, -441.8665771484375, -432.1206359863281, -422.37469482421875, -412.6287536621094, -402.8828125, -393.1368713378906, -383.39093017578125, -373.64495849609375, -363.8990173339844, -354.153076171875, -344.4071350097656, -334.66119384765625, -324.91522216796875, -315.1692810058594, -305.42333984375, -295.6773681640625, -285.9314270019531, -276.18548583984375, -266.4395446777344, -256.693603515625, -246.94766235351562, -237.20172119140625, -227.4557647705078, -217.70982360839844, -207.96388244628906, -198.21792602539062, -188.47198486328125, -178.72604370117188, -168.98008728027344, -159.23414611816406, -149.48818969726562, -139.74224853515625, -129.99630737304688, -120.25035858154297, -110.50440979003906, -100.75846862792969, -91.01251983642578, -81.26657104492188, -71.5206298828125, -61.774681091308594, -52.02873611450195, -42.28279113769531, -32.536842346191406, -22.79090118408203, -13.044952392578125, -3.299006462097168, 6.446939468383789, 16.192886352539062, 25.938831329345703, 35.684776306152344, 45.43072509765625, 55.176666259765625, 64.92261505126953, 74.66856384277344, 84.41450500488281, 94.16045379638672, 103.90640258789062, 113.65234375, 123.3982925415039, 133.14422607421875, 142.8901824951172]}, "gradients/decoder.model.decoder.layers.11.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 8.0, 13.0, 29.0, 28.0, 58.0, 94.0, 104.0, 110.0, 124.0, 149.0, 87.0, 101.0, 47.0, 30.0, 10.0, 9.0, 7.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.32072830200195, -57.8126106262207, -56.30449295043945, -54.7963752746582, -53.28825759887695, -51.7801399230957, -50.27202224731445, -48.7639045715332, -47.25578689575195, -45.7476692199707, -44.23955154418945, -42.7314338684082, -41.22331619262695, -39.7151985168457, -38.20708084106445, -36.6989631652832, -35.19084548950195, -33.6827278137207, -32.17461013793945, -30.666492462158203, -29.158374786376953, -27.650257110595703, -26.142139434814453, -24.634021759033203, -23.125904083251953, -21.617786407470703, -20.109668731689453, -18.601551055908203, -17.093433380126953, -15.585315704345703, -14.077198028564453, -12.569080352783203, -11.060966491699219, -9.552848815917969, -8.044731140136719, -6.536613464355469, -5.028495788574219, -3.5203781127929688, -2.0122604370117188, -0.5041427612304688, 1.0039749145507812, 2.5120925903320312, 4.020210266113281, 5.528327941894531, 7.036445617675781, 8.544563293457031, 10.052680969238281, 11.560798645019531, 13.068916320800781, 14.577033996582031, 16.08515167236328, 17.59326934814453, 19.10138702392578, 20.60950469970703, 22.11762237548828, 23.62574005126953, 25.13385772705078, 26.64197540283203, 28.15009307861328, 29.65821075439453, 31.16632843017578, 32.67444610595703, 34.18256378173828, 35.69068145751953, 37.19879913330078]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 5.0, 2.0, 2.0, 4.0, 4.0, 8.0, 15.0, 20.0, 16.0, 28.0, 32.0, 80.0, 143.0, 284.0, 723.0, 2073.0, 6428.0, 23459.0, 105639.0, 430875.0, 368729.0, 83096.0, 18566.0, 5356.0, 1766.0, 621.0, 280.0, 122.0, 59.0, 37.0, 24.0, 19.0, 9.0, 7.0, 6.0, 3.0, 6.0, 4.0, 6.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.40625, -11.0489501953125, -10.691650390625, -10.3343505859375, -9.97705078125, -9.6197509765625, -9.262451171875, -8.9051513671875, -8.5478515625, -8.1905517578125, -7.833251953125, -7.4759521484375, -7.11865234375, -6.7613525390625, -6.404052734375, -6.0467529296875, -5.689453125, -5.3321533203125, -4.974853515625, -4.6175537109375, -4.26025390625, -3.9029541015625, -3.545654296875, -3.1883544921875, -2.8310546875, -2.4737548828125, -2.116455078125, -1.7591552734375, -1.40185546875, -1.0445556640625, -0.687255859375, -0.3299560546875, 0.02734375, 0.3846435546875, 0.741943359375, 1.0992431640625, 1.45654296875, 1.8138427734375, 2.171142578125, 2.5284423828125, 2.8857421875, 3.2430419921875, 3.600341796875, 3.9576416015625, 4.31494140625, 4.6722412109375, 5.029541015625, 5.3868408203125, 5.744140625, 6.1014404296875, 6.458740234375, 6.8160400390625, 7.17333984375, 7.5306396484375, 7.887939453125, 8.2452392578125, 8.6025390625, 8.9598388671875, 9.317138671875, 9.6744384765625, 10.03173828125, 10.3890380859375, 10.746337890625, 11.1036376953125, 11.4609375]}, "gradients/decoder.model.decoder.layers.11.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 6.0, 5.0, 10.0, 14.0, 27.0, 28.0, 43.0, 59.0, 68.0, 96.0, 100.0, 109.0, 99.0, 86.0, 70.0, 66.0, 54.0, 32.0, 20.0, 14.0, 5.0, 3.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.25, -88.99755859375, -86.7451171875, -84.49267578125, -82.240234375, -79.98779296875, -77.7353515625, -75.48291015625, -73.23046875, -70.97802734375, -68.7255859375, -66.47314453125, -64.220703125, -61.96826171875, -59.7158203125, -57.46337890625, -55.2109375, -52.95849609375, -50.7060546875, -48.45361328125, -46.201171875, -43.94873046875, -41.6962890625, -39.44384765625, -37.19140625, -34.93896484375, -32.6865234375, -30.43408203125, -28.181640625, -25.92919921875, -23.6767578125, -21.42431640625, -19.171875, -16.91943359375, -14.6669921875, -12.41455078125, -10.162109375, -7.90966796875, -5.6572265625, -3.40478515625, -1.15234375, 1.10009765625, 3.3525390625, 5.60498046875, 7.857421875, 10.10986328125, 12.3623046875, 14.61474609375, 16.8671875, 19.11962890625, 21.3720703125, 23.62451171875, 25.876953125, 28.12939453125, 30.3818359375, 32.63427734375, 34.88671875, 37.13916015625, 39.3916015625, 41.64404296875, 43.896484375, 46.14892578125, 48.4013671875, 50.65380859375, 52.90625]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 5.0, 18.0, 17.0, 23.0, 21.0, 30.0, 47.0, 56.0, 77.0, 101.0, 161.0, 206.0, 319.0, 788.0, 2678.0, 24266.0, 582751.0, 416152.0, 16947.0, 2173.0, 651.0, 331.0, 201.0, 146.0, 100.0, 59.0, 55.0, 41.0, 26.0, 20.0, 21.0, 11.0, 15.0, 1.0, 7.0, 4.0, 2.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-23.109375, -22.33740234375, -21.5654296875, -20.79345703125, -20.021484375, -19.24951171875, -18.4775390625, -17.70556640625, -16.93359375, -16.16162109375, -15.3896484375, -14.61767578125, -13.845703125, -13.07373046875, -12.3017578125, -11.52978515625, -10.7578125, -9.98583984375, -9.2138671875, -8.44189453125, -7.669921875, -6.89794921875, -6.1259765625, -5.35400390625, -4.58203125, -3.81005859375, -3.0380859375, -2.26611328125, -1.494140625, -0.72216796875, 0.0498046875, 0.82177734375, 1.59375, 2.36572265625, 3.1376953125, 3.90966796875, 4.681640625, 5.45361328125, 6.2255859375, 6.99755859375, 7.76953125, 8.54150390625, 9.3134765625, 10.08544921875, 10.857421875, 11.62939453125, 12.4013671875, 13.17333984375, 13.9453125, 14.71728515625, 15.4892578125, 16.26123046875, 17.033203125, 17.80517578125, 18.5771484375, 19.34912109375, 20.12109375, 20.89306640625, 21.6650390625, 22.43701171875, 23.208984375, 23.98095703125, 24.7529296875, 25.52490234375, 26.296875]}, "gradients/decoder.model.decoder.layers.11.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 4.0, 12.0, 18.0, 18.0, 19.0, 25.0, 34.0, 33.0, 48.0, 45.0, 56.0, 73.0, 62.0, 81.0, 69.0, 64.0, 63.0, 52.0, 48.0, 47.0, 32.0, 25.0, 19.0, 18.0, 3.0, 11.0, 9.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.75, -41.30908203125, -39.8681640625, -38.42724609375, -36.986328125, -35.54541015625, -34.1044921875, -32.66357421875, -31.22265625, -29.78173828125, -28.3408203125, -26.89990234375, -25.458984375, -24.01806640625, -22.5771484375, -21.13623046875, -19.6953125, -18.25439453125, -16.8134765625, -15.37255859375, -13.931640625, -12.49072265625, -11.0498046875, -9.60888671875, -8.16796875, -6.72705078125, -5.2861328125, -3.84521484375, -2.404296875, -0.96337890625, 0.4775390625, 1.91845703125, 3.359375, 4.80029296875, 6.2412109375, 7.68212890625, 9.123046875, 10.56396484375, 12.0048828125, 13.44580078125, 14.88671875, 16.32763671875, 17.7685546875, 19.20947265625, 20.650390625, 22.09130859375, 23.5322265625, 24.97314453125, 26.4140625, 27.85498046875, 29.2958984375, 30.73681640625, 32.177734375, 33.61865234375, 35.0595703125, 36.50048828125, 37.94140625, 39.38232421875, 40.8232421875, 42.26416015625, 43.705078125, 45.14599609375, 46.5869140625, 48.02783203125, 49.46875]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 3.0, 6.0, 6.0, 23.0, 25.0, 48.0, 39.0, 81.0, 120.0, 282.0, 656.0, 1908.0, 7803.0, 114454.0, 888006.0, 28523.0, 4348.0, 1236.0, 461.0, 202.0, 110.0, 72.0, 48.0, 23.0, 22.0, 17.0, 9.0, 5.0, 4.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.4296875, -10.13427734375, -9.8388671875, -9.54345703125, -9.248046875, -8.95263671875, -8.6572265625, -8.36181640625, -8.06640625, -7.77099609375, -7.4755859375, -7.18017578125, -6.884765625, -6.58935546875, -6.2939453125, -5.99853515625, -5.703125, -5.40771484375, -5.1123046875, -4.81689453125, -4.521484375, -4.22607421875, -3.9306640625, -3.63525390625, -3.33984375, -3.04443359375, -2.7490234375, -2.45361328125, -2.158203125, -1.86279296875, -1.5673828125, -1.27197265625, -0.9765625, -0.68115234375, -0.3857421875, -0.09033203125, 0.205078125, 0.50048828125, 0.7958984375, 1.09130859375, 1.38671875, 1.68212890625, 1.9775390625, 2.27294921875, 2.568359375, 2.86376953125, 3.1591796875, 3.45458984375, 3.75, 4.04541015625, 4.3408203125, 4.63623046875, 4.931640625, 5.22705078125, 5.5224609375, 5.81787109375, 6.11328125, 6.40869140625, 6.7041015625, 6.99951171875, 7.294921875, 7.59033203125, 7.8857421875, 8.18115234375, 8.4765625]}, "gradients/decoder.model.decoder.layers.11.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 4.0, 3.0, 4.0, 8.0, 7.0, 16.0, 16.0, 24.0, 23.0, 32.0, 48.0, 58.0, 90.0, 91.0, 102.0, 108.0, 82.0, 65.0, 77.0, 40.0, 21.0, 20.0, 10.0, 15.0, 3.0, 3.0, 1.0, 7.0, 5.0, 5.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00063323974609375, -0.0006143525242805481, -0.0005954653024673462, -0.0005765780806541443, -0.0005576908588409424, -0.0005388036370277405, -0.0005199164152145386, -0.0005010291934013367, -0.00048214197158813477, -0.00046325474977493286, -0.00044436752796173096, -0.00042548030614852905, -0.00040659308433532715, -0.00038770586252212524, -0.00036881864070892334, -0.00034993141889572144, -0.00033104419708251953, -0.0003121569752693176, -0.0002932697534561157, -0.0002743825316429138, -0.0002554953098297119, -0.00023660808801651, -0.0002177208662033081, -0.0001988336443901062, -0.0001799464225769043, -0.0001610592007637024, -0.0001421719789505005, -0.00012328475713729858, -0.00010439753532409668, -8.551031351089478e-05, -6.662309169769287e-05, -4.773586988449097e-05, -2.8848648071289062e-05, -9.961426258087158e-06, 8.925795555114746e-06, 2.781301736831665e-05, 4.6700239181518555e-05, 6.558746099472046e-05, 8.447468280792236e-05, 0.00010336190462112427, 0.00012224912643432617, 0.00014113634824752808, 0.00016002357006072998, 0.00017891079187393188, 0.0001977980136871338, 0.0002166852355003357, 0.0002355724573135376, 0.0002544596791267395, 0.0002733469009399414, 0.0002922341227531433, 0.0003111213445663452, 0.0003300085663795471, 0.000348895788192749, 0.00036778301000595093, 0.00038667023181915283, 0.00040555745363235474, 0.00042444467544555664, 0.00044333189725875854, 0.00046221911907196045, 0.00048110634088516235, 0.0004999935626983643, 0.0005188807845115662, 0.0005377680063247681, 0.00055665522813797, 0.0005755424499511719]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 2.0, 2.0, 6.0, 10.0, 13.0, 26.0, 27.0, 46.0, 94.0, 168.0, 432.0, 1168.0, 5507.0, 52529.0, 812696.0, 162149.0, 10691.0, 1928.0, 557.0, 218.0, 108.0, 58.0, 31.0, 24.0, 19.0, 13.0, 6.0, 10.0, 4.0, 0.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.0234375, -7.79852294921875, -7.5736083984375, -7.34869384765625, -7.123779296875, -6.89886474609375, -6.6739501953125, -6.44903564453125, -6.22412109375, -5.99920654296875, -5.7742919921875, -5.54937744140625, -5.324462890625, -5.09954833984375, -4.8746337890625, -4.64971923828125, -4.4248046875, -4.19989013671875, -3.9749755859375, -3.75006103515625, -3.525146484375, -3.30023193359375, -3.0753173828125, -2.85040283203125, -2.62548828125, -2.40057373046875, -2.1756591796875, -1.95074462890625, -1.725830078125, -1.50091552734375, -1.2760009765625, -1.05108642578125, -0.826171875, -0.60125732421875, -0.3763427734375, -0.15142822265625, 0.073486328125, 0.29840087890625, 0.5233154296875, 0.74822998046875, 0.97314453125, 1.19805908203125, 1.4229736328125, 1.64788818359375, 1.872802734375, 2.09771728515625, 2.3226318359375, 2.54754638671875, 2.7724609375, 2.99737548828125, 3.2222900390625, 3.44720458984375, 3.672119140625, 3.89703369140625, 4.1219482421875, 4.34686279296875, 4.57177734375, 4.79669189453125, 5.0216064453125, 5.24652099609375, 5.471435546875, 5.69635009765625, 5.9212646484375, 6.14617919921875, 6.37109375]}, "gradients/decoder.model.decoder.layers.11.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 11.0, 10.0, 12.0, 21.0, 25.0, 32.0, 43.0, 71.0, 91.0, 121.0, 125.0, 111.0, 82.0, 65.0, 41.0, 41.0, 35.0, 11.0, 13.0, 9.0, 7.0, 5.0, 6.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.21875, -2.1594085693359375, -2.100067138671875, -2.0407257080078125, -1.98138427734375, -1.9220428466796875, -1.862701416015625, -1.8033599853515625, -1.7440185546875, -1.6846771240234375, -1.625335693359375, -1.5659942626953125, -1.50665283203125, -1.4473114013671875, -1.387969970703125, -1.3286285400390625, -1.269287109375, -1.2099456787109375, -1.150604248046875, -1.0912628173828125, -1.03192138671875, -0.9725799560546875, -0.913238525390625, -0.8538970947265625, -0.7945556640625, -0.7352142333984375, -0.675872802734375, -0.6165313720703125, -0.55718994140625, -0.4978485107421875, -0.438507080078125, -0.3791656494140625, -0.31982421875, -0.2604827880859375, -0.201141357421875, -0.1417999267578125, -0.08245849609375, -0.0231170654296875, 0.036224365234375, 0.0955657958984375, 0.1549072265625, 0.2142486572265625, 0.273590087890625, 0.3329315185546875, 0.39227294921875, 0.4516143798828125, 0.510955810546875, 0.5702972412109375, 0.629638671875, 0.6889801025390625, 0.748321533203125, 0.8076629638671875, 0.86700439453125, 0.9263458251953125, 0.985687255859375, 1.0450286865234375, 1.1043701171875, 1.1637115478515625, 1.223052978515625, 1.2823944091796875, 1.34173583984375, 1.4010772705078125, 1.460418701171875, 1.5197601318359375, 1.5791015625]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 375.0, 595.0, 39.0, 4.0, 0.0, 1.0], "bins": [-695.423828125, -683.652099609375, -671.8803100585938, -660.1085815429688, -648.3367919921875, -636.5650634765625, -624.7933349609375, -613.0215454101562, -601.2498168945312, -589.4780883789062, -577.706298828125, -565.9345703125, -554.1627807617188, -542.3910522460938, -530.6193237304688, -518.8475341796875, -507.0758056640625, -495.3040466308594, -483.53228759765625, -471.76055908203125, -459.9888000488281, -448.217041015625, -436.4452819824219, -424.67352294921875, -412.9017639160156, -401.1300048828125, -389.3582458496094, -377.5865173339844, -365.81475830078125, -354.0429992675781, -342.271240234375, -330.49951171875, -318.727783203125, -306.9560241699219, -295.18426513671875, -283.41253662109375, -271.6407775878906, -259.8690185546875, -248.09725952148438, -236.3255157470703, -224.55374145507812, -212.781982421875, -201.01023864746094, -189.2384796142578, -177.46673583984375, -165.69497680664062, -153.9232177734375, -142.15147399902344, -130.37973022460938, -118.60797882080078, -106.83622741699219, -95.06446838378906, -83.292724609375, -71.52096557617188, -59.74921417236328, -47.97746276855469, -36.205711364746094, -24.4339599609375, -12.662206649780273, -0.8904533386230469, 10.881298065185547, 22.65304946899414, 34.4248046875, 46.196556091308594, 57.96830749511719]}, "gradients/decoder.model.decoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 4.0, 4.0, 11.0, 16.0, 11.0, 25.0, 28.0, 41.0, 54.0, 63.0, 41.0, 62.0, 61.0, 64.0, 64.0, 61.0, 69.0, 54.0, 60.0, 48.0, 42.0, 35.0, 32.0, 19.0, 15.0, 8.0, 9.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.17243957519531, -95.64674377441406, -93.12105560302734, -90.59536743164062, -88.06967163085938, -85.54397583007812, -83.0182876586914, -80.49259948730469, -77.96690368652344, -75.44120788574219, -72.91551971435547, -70.38983154296875, -67.8641357421875, -65.33843994140625, -62.81275177001953, -60.28705978393555, -57.76136779785156, -55.23567581176758, -52.709983825683594, -50.18429183959961, -47.658599853515625, -45.13290786743164, -42.607215881347656, -40.08152389526367, -37.55583190917969, -35.0301399230957, -32.50444793701172, -29.978755950927734, -27.45306396484375, -24.927371978759766, -22.40167999267578, -19.875988006591797, -17.350303649902344, -14.82461166381836, -12.298919677734375, -9.77322769165039, -7.247535705566406, -4.721843719482422, -2.1961517333984375, 0.3295402526855469, 2.8552322387695312, 5.380924224853516, 7.9066162109375, 10.432308197021484, 12.958000183105469, 15.483692169189453, 18.009384155273438, 20.535076141357422, 23.060768127441406, 25.58646011352539, 28.112152099609375, 30.63784408569336, 33.163536071777344, 35.68922805786133, 38.21492004394531, 40.7406120300293, 43.26630401611328, 45.791996002197266, 48.31768798828125, 50.843379974365234, 53.36907196044922, 55.8947639465332, 58.42045593261719, 60.94614791870117, 63.471839904785156]}, "gradients/decoder.model.decoder.layers.10.fc2.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 5.0, 5.0, 4.0, 5.0, 13.0, 9.0, 19.0, 25.0, 35.0, 61.0, 79.0, 146.0, 295.0, 1100.0, 5919.0, 45681.0, 825489.0, 2980874.0, 308027.0, 19617.0, 2847.0, 903.0, 669.0, 749.0, 655.0, 520.0, 317.0, 151.0, 43.0, 9.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-48.03125, -46.70947265625, -45.3876953125, -44.06591796875, -42.744140625, -41.42236328125, -40.1005859375, -38.77880859375, -37.45703125, -36.13525390625, -34.8134765625, -33.49169921875, -32.169921875, -30.84814453125, -29.5263671875, -28.20458984375, -26.8828125, -25.56103515625, -24.2392578125, -22.91748046875, -21.595703125, -20.27392578125, -18.9521484375, -17.63037109375, -16.30859375, -14.98681640625, -13.6650390625, -12.34326171875, -11.021484375, -9.69970703125, -8.3779296875, -7.05615234375, -5.734375, -4.41259765625, -3.0908203125, -1.76904296875, -0.447265625, 0.87451171875, 2.1962890625, 3.51806640625, 4.83984375, 6.16162109375, 7.4833984375, 8.80517578125, 10.126953125, 11.44873046875, 12.7705078125, 14.09228515625, 15.4140625, 16.73583984375, 18.0576171875, 19.37939453125, 20.701171875, 22.02294921875, 23.3447265625, 24.66650390625, 25.98828125, 27.31005859375, 28.6318359375, 29.95361328125, 31.275390625, 32.59716796875, 33.9189453125, 35.24072265625, 36.5625]}, "gradients/decoder.model.decoder.layers.10.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 10.0, 20.0, 43.0, 85.0, 158.0, 168.0, 186.0, 167.0, 108.0, 45.0, 11.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.5625, -108.30810546875, -106.0537109375, -103.79931640625, -101.544921875, -99.29052734375, -97.0361328125, -94.78173828125, -92.52734375, -90.27294921875, -88.0185546875, -85.76416015625, -83.509765625, -81.25537109375, -79.0009765625, -76.74658203125, -74.4921875, -72.23779296875, -69.9833984375, -67.72900390625, -65.474609375, -63.22021484375, -60.9658203125, -58.71142578125, -56.45703125, -54.20263671875, -51.9482421875, -49.69384765625, -47.439453125, -45.18505859375, -42.9306640625, -40.67626953125, -38.421875, -36.16748046875, -33.9130859375, -31.65869140625, -29.404296875, -27.14990234375, -24.8955078125, -22.64111328125, -20.38671875, -18.13232421875, -15.8779296875, -13.62353515625, -11.369140625, -9.11474609375, -6.8603515625, -4.60595703125, -2.3515625, -0.09716796875, 2.1572265625, 4.41162109375, 6.666015625, 8.92041015625, 11.1748046875, 13.42919921875, 15.68359375, 17.93798828125, 20.1923828125, 22.44677734375, 24.701171875, 26.95556640625, 29.2099609375, 31.46435546875, 33.71875]}, "gradients/decoder.model.decoder.layers.10.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 4.0, 5.0, 8.0, 11.0, 32.0, 76.0, 273.0, 2460.0, 4180869.0, 9793.0, 537.0, 124.0, 53.0, 15.0, 6.0, 6.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-189.5, -181.80859375, -174.1171875, -166.42578125, -158.734375, -151.04296875, -143.3515625, -135.66015625, -127.96875, -120.27734375, -112.5859375, -104.89453125, -97.203125, -89.51171875, -81.8203125, -74.12890625, -66.4375, -58.74609375, -51.0546875, -43.36328125, -35.671875, -27.98046875, -20.2890625, -12.59765625, -4.90625, 2.78515625, 10.4765625, 18.16796875, 25.859375, 33.55078125, 41.2421875, 48.93359375, 56.625, 64.31640625, 72.0078125, 79.69921875, 87.390625, 95.08203125, 102.7734375, 110.46484375, 118.15625, 125.84765625, 133.5390625, 141.23046875, 148.921875, 156.61328125, 164.3046875, 171.99609375, 179.6875, 187.37890625, 195.0703125, 202.76171875, 210.453125, 218.14453125, 225.8359375, 233.52734375, 241.21875, 248.91015625, 256.6015625, 264.29296875, 271.984375, 279.67578125, 287.3671875, 295.05859375, 302.75]}, "gradients/decoder.model.decoder.layers.10.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 9.0, 19.0, 21.0, 74.0, 208.0, 839.0, 1938.0, 680.0, 183.0, 62.0, 27.0, 9.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-23.375, -22.3779296875, -21.380859375, -20.3837890625, -19.38671875, -18.3896484375, -17.392578125, -16.3955078125, -15.3984375, -14.4013671875, -13.404296875, -12.4072265625, -11.41015625, -10.4130859375, -9.416015625, -8.4189453125, -7.421875, -6.4248046875, -5.427734375, -4.4306640625, -3.43359375, -2.4365234375, -1.439453125, -0.4423828125, 0.5546875, 1.5517578125, 2.548828125, 3.5458984375, 4.54296875, 5.5400390625, 6.537109375, 7.5341796875, 8.53125, 9.5283203125, 10.525390625, 11.5224609375, 12.51953125, 13.5166015625, 14.513671875, 15.5107421875, 16.5078125, 17.5048828125, 18.501953125, 19.4990234375, 20.49609375, 21.4931640625, 22.490234375, 23.4873046875, 24.484375, 25.4814453125, 26.478515625, 27.4755859375, 28.47265625, 29.4697265625, 30.466796875, 31.4638671875, 32.4609375, 33.4580078125, 34.455078125, 35.4521484375, 36.44921875, 37.4462890625, 38.443359375, 39.4404296875, 40.4375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 13.0, 94.0, 389.0, 363.0, 123.0, 20.0, 7.0, 4.0, 1.0, 2.0, 2.0], "bins": [-243.615966796875, -239.26756286621094, -234.91915893554688, -230.57077026367188, -226.2223663330078, -221.87396240234375, -217.52557373046875, -213.1771697998047, -208.82876586914062, -204.48036193847656, -200.1319580078125, -195.7835693359375, -191.43516540527344, -187.08676147460938, -182.73837280273438, -178.3899688720703, -174.04156494140625, -169.6931610107422, -165.34475708007812, -160.99636840820312, -156.64796447753906, -152.299560546875, -147.951171875, -143.60276794433594, -139.25436401367188, -134.9059600830078, -130.55755615234375, -126.20916748046875, -121.86076354980469, -117.51235961914062, -113.1639633178711, -108.81556701660156, -104.4671630859375, -100.11875915527344, -95.7703628540039, -91.42196655273438, -87.07356262207031, -82.72515869140625, -78.37676239013672, -74.02836608886719, -69.67996215820312, -65.33155822753906, -60.98316192626953, -56.634761810302734, -52.28636169433594, -47.93796157836914, -43.589561462402344, -39.24116134643555, -34.89276123046875, -30.544361114501953, -26.195960998535156, -21.84756088256836, -17.499160766601562, -13.150760650634766, -8.802360534667969, -4.453960418701172, -0.105560302734375, 4.242839813232422, 8.591239929199219, 12.939640045166016, 17.288040161132812, 21.63644027709961, 25.984840393066406, 30.333240509033203, 34.681640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 11.0, 14.0, 19.0, 30.0, 55.0, 69.0, 77.0, 89.0, 115.0, 118.0, 95.0, 100.0, 75.0, 50.0, 39.0, 31.0, 13.0, 5.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.84228515625, -70.28286743164062, -68.72344970703125, -67.1640396118164, -65.60462188720703, -64.04520416259766, -62.48579025268555, -60.92637634277344, -59.36695861816406, -57.80754089355469, -56.24812698364258, -54.68871307373047, -53.129295349121094, -51.56987762451172, -50.01046371459961, -48.4510498046875, -46.891632080078125, -45.33221435546875, -43.77280044555664, -42.21338653564453, -40.653968811035156, -39.09455108642578, -37.53513717651367, -35.97572326660156, -34.41630554199219, -32.85688781738281, -31.297473907470703, -29.73805809020996, -28.17864227294922, -26.619226455688477, -25.059810638427734, -23.500394821166992, -21.940980911254883, -20.38156509399414, -18.8221492767334, -17.262733459472656, -15.703317642211914, -14.143901824951172, -12.58448600769043, -11.025070190429688, -9.465654373168945, -7.906238555908203, -6.346822738647461, -4.787406921386719, -3.2279911041259766, -1.6685752868652344, -0.10915946960449219, 1.45025634765625, 3.009672164916992, 4.569087982177734, 6.128503799438477, 7.687919616699219, 9.247335433959961, 10.806751251220703, 12.366167068481445, 13.925582885742188, 15.48499870300293, 17.044414520263672, 18.603830337524414, 20.163246154785156, 21.7226619720459, 23.28207778930664, 24.841493606567383, 26.400909423828125, 27.960325241088867]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 5.0, 13.0, 29.0, 44.0, 81.0, 196.0, 537.0, 1604.0, 7511.0, 202983.0, 799040.0, 31806.0, 3203.0, 924.0, 303.0, 113.0, 68.0, 42.0, 15.0, 7.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.5625, -17.034423828125, -16.50634765625, -15.978271484375, -15.4501953125, -14.922119140625, -14.39404296875, -13.865966796875, -13.337890625, -12.809814453125, -12.28173828125, -11.753662109375, -11.2255859375, -10.697509765625, -10.16943359375, -9.641357421875, -9.11328125, -8.585205078125, -8.05712890625, -7.529052734375, -7.0009765625, -6.472900390625, -5.94482421875, -5.416748046875, -4.888671875, -4.360595703125, -3.83251953125, -3.304443359375, -2.7763671875, -2.248291015625, -1.72021484375, -1.192138671875, -0.6640625, -0.135986328125, 0.39208984375, 0.920166015625, 1.4482421875, 1.976318359375, 2.50439453125, 3.032470703125, 3.560546875, 4.088623046875, 4.61669921875, 5.144775390625, 5.6728515625, 6.200927734375, 6.72900390625, 7.257080078125, 7.78515625, 8.313232421875, 8.84130859375, 9.369384765625, 9.8974609375, 10.425537109375, 10.95361328125, 11.481689453125, 12.009765625, 12.537841796875, 13.06591796875, 13.593994140625, 14.1220703125, 14.650146484375, 15.17822265625, 15.706298828125, 16.234375]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 10.0, 18.0, 37.0, 51.0, 77.0, 95.0, 105.0, 131.0, 124.0, 119.0, 81.0, 62.0, 45.0, 25.0, 13.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.6875, -61.3447265625, -60.001953125, -58.6591796875, -57.31640625, -55.9736328125, -54.630859375, -53.2880859375, -51.9453125, -50.6025390625, -49.259765625, -47.9169921875, -46.57421875, -45.2314453125, -43.888671875, -42.5458984375, -41.203125, -39.8603515625, -38.517578125, -37.1748046875, -35.83203125, -34.4892578125, -33.146484375, -31.8037109375, -30.4609375, -29.1181640625, -27.775390625, -26.4326171875, -25.08984375, -23.7470703125, -22.404296875, -21.0615234375, -19.71875, -18.3759765625, -17.033203125, -15.6904296875, -14.34765625, -13.0048828125, -11.662109375, -10.3193359375, -8.9765625, -7.6337890625, -6.291015625, -4.9482421875, -3.60546875, -2.2626953125, -0.919921875, 0.4228515625, 1.765625, 3.1083984375, 4.451171875, 5.7939453125, 7.13671875, 8.4794921875, 9.822265625, 11.1650390625, 12.5078125, 13.8505859375, 15.193359375, 16.5361328125, 17.87890625, 19.2216796875, 20.564453125, 21.9072265625, 23.25]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 6.0, 15.0, 24.0, 17.0, 50.0, 62.0, 79.0, 127.0, 200.0, 312.0, 517.0, 943.0, 1520.0, 2686.0, 4997.0, 9179.0, 17752.0, 33985.0, 68574.0, 133025.0, 213433.0, 230423.0, 158157.0, 84626.0, 42356.0, 21012.0, 10823.0, 5871.0, 3313.0, 1775.0, 1087.0, 608.0, 360.0, 250.0, 137.0, 87.0, 50.0, 38.0, 30.0, 13.0, 13.0, 6.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.251953125, -2.181915283203125, -2.11187744140625, -2.041839599609375, -1.9718017578125, -1.901763916015625, -1.83172607421875, -1.761688232421875, -1.691650390625, -1.621612548828125, -1.55157470703125, -1.481536865234375, -1.4114990234375, -1.341461181640625, -1.27142333984375, -1.201385498046875, -1.13134765625, -1.061309814453125, -0.99127197265625, -0.921234130859375, -0.8511962890625, -0.781158447265625, -0.71112060546875, -0.641082763671875, -0.571044921875, -0.501007080078125, -0.43096923828125, -0.360931396484375, -0.2908935546875, -0.220855712890625, -0.15081787109375, -0.080780029296875, -0.0107421875, 0.059295654296875, 0.12933349609375, 0.199371337890625, 0.2694091796875, 0.339447021484375, 0.40948486328125, 0.479522705078125, 0.549560546875, 0.619598388671875, 0.68963623046875, 0.759674072265625, 0.8297119140625, 0.899749755859375, 0.96978759765625, 1.039825439453125, 1.10986328125, 1.179901123046875, 1.24993896484375, 1.319976806640625, 1.3900146484375, 1.460052490234375, 1.53009033203125, 1.600128173828125, 1.670166015625, 1.740203857421875, 1.81024169921875, 1.880279541015625, 1.9503173828125, 2.020355224609375, 2.09039306640625, 2.160430908203125, 2.23046875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 9.0, 10.0, 13.0, 13.0, 22.0, 11.0, 17.0, 20.0, 26.0, 23.0, 26.0, 30.0, 38.0, 47.0, 39.0, 47.0, 51.0, 37.0, 45.0, 43.0, 52.0, 35.0, 34.0, 42.0, 27.0, 28.0, 31.0, 27.0, 23.0, 18.0, 15.0, 16.0, 14.0, 16.0, 7.0, 11.0, 7.0, 4.0, 8.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-31.09375, -30.138671875, -29.18359375, -28.228515625, -27.2734375, -26.318359375, -25.36328125, -24.408203125, -23.453125, -22.498046875, -21.54296875, -20.587890625, -19.6328125, -18.677734375, -17.72265625, -16.767578125, -15.8125, -14.857421875, -13.90234375, -12.947265625, -11.9921875, -11.037109375, -10.08203125, -9.126953125, -8.171875, -7.216796875, -6.26171875, -5.306640625, -4.3515625, -3.396484375, -2.44140625, -1.486328125, -0.53125, 0.423828125, 1.37890625, 2.333984375, 3.2890625, 4.244140625, 5.19921875, 6.154296875, 7.109375, 8.064453125, 9.01953125, 9.974609375, 10.9296875, 11.884765625, 12.83984375, 13.794921875, 14.75, 15.705078125, 16.66015625, 17.615234375, 18.5703125, 19.525390625, 20.48046875, 21.435546875, 22.390625, 23.345703125, 24.30078125, 25.255859375, 26.2109375, 27.166015625, 28.12109375, 29.076171875, 30.03125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 6.0, 9.0, 9.0, 13.0, 22.0, 29.0, 49.0, 62.0, 101.0, 138.0, 249.0, 404.0, 664.0, 1302.0, 2596.0, 5759.0, 15826.0, 52298.0, 223221.0, 487956.0, 188505.0, 44718.0, 13964.0, 5383.0, 2386.0, 1190.0, 704.0, 372.0, 211.0, 128.0, 77.0, 66.0, 51.0, 30.0, 16.0, 11.0, 9.0, 8.0, 5.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.47412109375, -0.4590415954589844, -0.44396209716796875, -0.4288825988769531, -0.4138031005859375, -0.3987236022949219, -0.38364410400390625, -0.3685646057128906, -0.353485107421875, -0.3384056091308594, -0.32332611083984375, -0.3082466125488281, -0.2931671142578125, -0.2780876159667969, -0.26300811767578125, -0.24792861938476562, -0.23284912109375, -0.21776962280273438, -0.20269012451171875, -0.18761062622070312, -0.1725311279296875, -0.15745162963867188, -0.14237213134765625, -0.12729263305664062, -0.112213134765625, -0.09713363647460938, -0.08205413818359375, -0.06697463989257812, -0.0518951416015625, -0.036815643310546875, -0.02173614501953125, -0.006656646728515625, 0.0084228515625, 0.023502349853515625, 0.03858184814453125, 0.053661346435546875, 0.0687408447265625, 0.08382034301757812, 0.09889984130859375, 0.11397933959960938, 0.129058837890625, 0.14413833618164062, 0.15921783447265625, 0.17429733276367188, 0.1893768310546875, 0.20445632934570312, 0.21953582763671875, 0.23461532592773438, 0.24969482421875, 0.2647743225097656, 0.27985382080078125, 0.2949333190917969, 0.3100128173828125, 0.3250923156738281, 0.34017181396484375, 0.3552513122558594, 0.370330810546875, 0.3854103088378906, 0.40048980712890625, 0.4155693054199219, 0.4306488037109375, 0.4457283020019531, 0.46080780029296875, 0.4758872985839844, 0.490966796875]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 6.0, 6.0, 8.0, 9.0, 20.0, 25.0, 24.0, 46.0, 44.0, 73.0, 82.0, 90.0, 101.0, 90.0, 81.0, 61.0, 61.0, 41.0, 33.0, 28.0, 17.0, 11.0, 7.0, 8.0, 7.0, 7.0, 3.0, 4.0, 0.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00026726722717285156, -0.0002572201192378998, -0.000247173011302948, -0.00023712590336799622, -0.00022707879543304443, -0.00021703168749809265, -0.00020698457956314087, -0.0001969374716281891, -0.0001868903636932373, -0.00017684325575828552, -0.00016679614782333374, -0.00015674903988838196, -0.00014670193195343018, -0.0001366548240184784, -0.0001266077160835266, -0.00011656060814857483, -0.00010651350021362305, -9.646639227867126e-05, -8.641928434371948e-05, -7.63721764087677e-05, -6.632506847381592e-05, -5.6277960538864136e-05, -4.6230852603912354e-05, -3.618374466896057e-05, -2.613663673400879e-05, -1.6089528799057007e-05, -6.042420864105225e-06, 4.004687070846558e-06, 1.405179500579834e-05, 2.4098902940750122e-05, 3.4146010875701904e-05, 4.4193118810653687e-05, 5.424022674560547e-05, 6.428733468055725e-05, 7.433444261550903e-05, 8.438155055046082e-05, 9.44286584854126e-05, 0.00010447576642036438, 0.00011452287435531616, 0.00012456998229026794, 0.00013461709022521973, 0.0001446641981601715, 0.0001547113060951233, 0.00016475841403007507, 0.00017480552196502686, 0.00018485262989997864, 0.00019489973783493042, 0.0002049468457698822, 0.00021499395370483398, 0.00022504106163978577, 0.00023508816957473755, 0.00024513527750968933, 0.0002551823854446411, 0.0002652294933795929, 0.0002752766013145447, 0.00028532370924949646, 0.00029537081718444824, 0.0003054179251194, 0.0003154650330543518, 0.0003255121409893036, 0.00033555924892425537, 0.00034560635685920715, 0.00035565346479415894, 0.0003657005727291107, 0.0003757476806640625]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 8.0, 8.0, 20.0, 18.0, 23.0, 30.0, 53.0, 113.0, 194.0, 405.0, 909.0, 2669.0, 10029.0, 73552.0, 826464.0, 116829.0, 12320.0, 2944.0, 1000.0, 433.0, 215.0, 129.0, 64.0, 47.0, 17.0, 18.0, 11.0, 10.0, 4.0, 6.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.171875, -1.134765625, -1.09765625, -1.060546875, -1.0234375, -0.986328125, -0.94921875, -0.912109375, -0.875, -0.837890625, -0.80078125, -0.763671875, -0.7265625, -0.689453125, -0.65234375, -0.615234375, -0.578125, -0.541015625, -0.50390625, -0.466796875, -0.4296875, -0.392578125, -0.35546875, -0.318359375, -0.28125, -0.244140625, -0.20703125, -0.169921875, -0.1328125, -0.095703125, -0.05859375, -0.021484375, 0.015625, 0.052734375, 0.08984375, 0.126953125, 0.1640625, 0.201171875, 0.23828125, 0.275390625, 0.3125, 0.349609375, 0.38671875, 0.423828125, 0.4609375, 0.498046875, 0.53515625, 0.572265625, 0.609375, 0.646484375, 0.68359375, 0.720703125, 0.7578125, 0.794921875, 0.83203125, 0.869140625, 0.90625, 0.943359375, 0.98046875, 1.017578125, 1.0546875, 1.091796875, 1.12890625, 1.166015625, 1.203125]}, "gradients/decoder.model.decoder.layers.10.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 4.0, 3.0, 6.0, 13.0, 10.0, 12.0, 21.0, 30.0, 47.0, 57.0, 86.0, 101.0, 132.0, 124.0, 79.0, 73.0, 56.0, 39.0, 26.0, 15.0, 19.0, 9.0, 7.0, 6.0, 4.0, 5.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.331298828125, -0.3208160400390625, -0.310333251953125, -0.2998504638671875, -0.28936767578125, -0.2788848876953125, -0.268402099609375, -0.2579193115234375, -0.2474365234375, -0.2369537353515625, -0.226470947265625, -0.2159881591796875, -0.20550537109375, -0.1950225830078125, -0.184539794921875, -0.1740570068359375, -0.16357421875, -0.1530914306640625, -0.142608642578125, -0.1321258544921875, -0.12164306640625, -0.1111602783203125, -0.100677490234375, -0.0901947021484375, -0.0797119140625, -0.0692291259765625, -0.058746337890625, -0.0482635498046875, -0.03778076171875, -0.0272979736328125, -0.016815185546875, -0.0063323974609375, 0.004150390625, 0.0146331787109375, 0.025115966796875, 0.0355987548828125, 0.04608154296875, 0.0565643310546875, 0.067047119140625, 0.0775299072265625, 0.0880126953125, 0.0984954833984375, 0.108978271484375, 0.1194610595703125, 0.12994384765625, 0.1404266357421875, 0.150909423828125, 0.1613922119140625, 0.171875, 0.1823577880859375, 0.192840576171875, 0.2033233642578125, 0.21380615234375, 0.2242889404296875, 0.234771728515625, 0.2452545166015625, 0.2557373046875, 0.2662200927734375, 0.276702880859375, 0.2871856689453125, 0.29766845703125, 0.3081512451171875, 0.318634033203125, 0.3291168212890625, 0.339599609375]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 8.0, 79.0, 436.0, 400.0, 68.0, 15.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.76638793945312, -161.4674072265625, -158.16844177246094, -154.8694610595703, -151.57049560546875, -148.27151489257812, -144.97254943847656, -141.67356872558594, -138.37460327148438, -135.07562255859375, -131.7766571044922, -128.47767639160156, -125.1787109375, -121.8797378540039, -118.58076477050781, -115.28179168701172, -111.98281860351562, -108.68384552001953, -105.38487243652344, -102.08589935302734, -98.78692626953125, -95.48795318603516, -92.18898010253906, -88.89000701904297, -85.59102630615234, -82.29205322265625, -78.99308013916016, -75.69410705566406, -72.39513397216797, -69.09616088867188, -65.79718780517578, -62.49821472167969, -59.19924545288086, -55.900272369384766, -52.60129928588867, -49.30232620239258, -46.003353118896484, -42.704376220703125, -39.40540313720703, -36.10643005371094, -32.807456970214844, -29.50848388671875, -26.209510803222656, -22.910537719726562, -19.61156463623047, -16.312589645385742, -13.013616561889648, -9.714643478393555, -6.415672302246094, -3.116698980331421, 0.18227434158325195, 3.481247901916504, 6.780220985412598, 10.079195022583008, 13.378168106079102, 16.677141189575195, 19.97611427307129, 23.275087356567383, 26.574060440063477, 29.873035430908203, 33.1720085144043, 36.47098159790039, 39.769954681396484, 43.06892776489258, 46.36790084838867]}, "gradients/decoder.model.decoder.layers.10.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 10.0, 20.0, 38.0, 54.0, 83.0, 94.0, 120.0, 145.0, 129.0, 114.0, 76.0, 45.0, 40.0, 20.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-64.99473571777344, -63.626502990722656, -62.25826644897461, -60.89003372192383, -59.52180099487305, -58.153564453125, -56.78533172607422, -55.41709899902344, -54.048866271972656, -52.680633544921875, -51.31239700317383, -49.94416427612305, -48.575931549072266, -47.20769500732422, -45.83946228027344, -44.471229553222656, -43.10299301147461, -41.73476028442383, -40.36652374267578, -38.998291015625, -37.63005828857422, -36.26182556152344, -34.89358901977539, -33.52535629272461, -32.15711975097656, -30.78888511657715, -29.420652389526367, -28.052417755126953, -26.684185028076172, -25.315950393676758, -23.947715759277344, -22.579483032226562, -21.211252212524414, -19.843017578125, -18.47478485107422, -17.106550216674805, -15.738316535949707, -14.37008285522461, -13.001848220825195, -11.633614540100098, -10.265380859375, -8.897147178649902, -7.5289130210876465, -6.160678863525391, -4.792445182800293, -3.4242115020751953, -2.0559768676757812, -0.6877431869506836, 0.6804904937744141, 2.048724412918091, 3.4169583320617676, 4.785192489624023, 6.153426170349121, 7.521659851074219, 8.889894485473633, 10.25812816619873, 11.626361846923828, 12.994595527648926, 14.362829208374023, 15.731063842773438, 17.09929656982422, 18.467531204223633, 19.835765838623047, 21.203998565673828, 22.572233200073242]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 4.0, 4.0, 14.0, 18.0, 34.0, 51.0, 79.0, 192.0, 446.0, 1296.0, 5598.0, 31957.0, 317857.0, 611636.0, 66227.0, 9819.0, 2167.0, 639.0, 249.0, 102.0, 59.0, 26.0, 30.0, 14.0, 8.0, 7.0, 6.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.84375, -19.9814453125, -19.119140625, -18.2568359375, -17.39453125, -16.5322265625, -15.669921875, -14.8076171875, -13.9453125, -13.0830078125, -12.220703125, -11.3583984375, -10.49609375, -9.6337890625, -8.771484375, -7.9091796875, -7.046875, -6.1845703125, -5.322265625, -4.4599609375, -3.59765625, -2.7353515625, -1.873046875, -1.0107421875, -0.1484375, 0.7138671875, 1.576171875, 2.4384765625, 3.30078125, 4.1630859375, 5.025390625, 5.8876953125, 6.75, 7.6123046875, 8.474609375, 9.3369140625, 10.19921875, 11.0615234375, 11.923828125, 12.7861328125, 13.6484375, 14.5107421875, 15.373046875, 16.2353515625, 17.09765625, 17.9599609375, 18.822265625, 19.6845703125, 20.546875, 21.4091796875, 22.271484375, 23.1337890625, 23.99609375, 24.8583984375, 25.720703125, 26.5830078125, 27.4453125, 28.3076171875, 29.169921875, 30.0322265625, 30.89453125, 31.7568359375, 32.619140625, 33.4814453125, 34.34375]}, "gradients/decoder.model.decoder.layers.10.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 12.0, 17.0, 26.0, 39.0, 55.0, 58.0, 64.0, 81.0, 90.0, 97.0, 96.0, 87.0, 79.0, 81.0, 43.0, 30.0, 21.0, 11.0, 8.0, 1.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.25, -75.509765625, -73.76953125, -72.029296875, -70.2890625, -68.548828125, -66.80859375, -65.068359375, -63.328125, -61.587890625, -59.84765625, -58.107421875, -56.3671875, -54.626953125, -52.88671875, -51.146484375, -49.40625, -47.666015625, -45.92578125, -44.185546875, -42.4453125, -40.705078125, -38.96484375, -37.224609375, -35.484375, -33.744140625, -32.00390625, -30.263671875, -28.5234375, -26.783203125, -25.04296875, -23.302734375, -21.5625, -19.822265625, -18.08203125, -16.341796875, -14.6015625, -12.861328125, -11.12109375, -9.380859375, -7.640625, -5.900390625, -4.16015625, -2.419921875, -0.6796875, 1.060546875, 2.80078125, 4.541015625, 6.28125, 8.021484375, 9.76171875, 11.501953125, 13.2421875, 14.982421875, 16.72265625, 18.462890625, 20.203125, 21.943359375, 23.68359375, 25.423828125, 27.1640625, 28.904296875, 30.64453125, 32.384765625, 34.125]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 5.0, 2.0, 6.0, 5.0, 8.0, 8.0, 6.0, 8.0, 13.0, 16.0, 30.0, 26.0, 30.0, 56.0, 74.0, 116.0, 155.0, 238.0, 1617.0, 972202.0, 72669.0, 592.0, 195.0, 125.0, 84.0, 76.0, 58.0, 31.0, 18.0, 22.0, 13.0, 9.0, 12.0, 7.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-132.375, -128.341796875, -124.30859375, -120.275390625, -116.2421875, -112.208984375, -108.17578125, -104.142578125, -100.109375, -96.076171875, -92.04296875, -88.009765625, -83.9765625, -79.943359375, -75.91015625, -71.876953125, -67.84375, -63.810546875, -59.77734375, -55.744140625, -51.7109375, -47.677734375, -43.64453125, -39.611328125, -35.578125, -31.544921875, -27.51171875, -23.478515625, -19.4453125, -15.412109375, -11.37890625, -7.345703125, -3.3125, 0.720703125, 4.75390625, 8.787109375, 12.8203125, 16.853515625, 20.88671875, 24.919921875, 28.953125, 32.986328125, 37.01953125, 41.052734375, 45.0859375, 49.119140625, 53.15234375, 57.185546875, 61.21875, 65.251953125, 69.28515625, 73.318359375, 77.3515625, 81.384765625, 85.41796875, 89.451171875, 93.484375, 97.517578125, 101.55078125, 105.583984375, 109.6171875, 113.650390625, 117.68359375, 121.716796875, 125.75]}, "gradients/decoder.model.decoder.layers.10.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 9.0, 10.0, 16.0, 15.0, 21.0, 38.0, 48.0, 64.0, 60.0, 61.0, 62.0, 65.0, 69.0, 78.0, 73.0, 79.0, 47.0, 36.0, 33.0, 31.0, 16.0, 14.0, 7.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-57.4375, -55.70361328125, -53.9697265625, -52.23583984375, -50.501953125, -48.76806640625, -47.0341796875, -45.30029296875, -43.56640625, -41.83251953125, -40.0986328125, -38.36474609375, -36.630859375, -34.89697265625, -33.1630859375, -31.42919921875, -29.6953125, -27.96142578125, -26.2275390625, -24.49365234375, -22.759765625, -21.02587890625, -19.2919921875, -17.55810546875, -15.82421875, -14.09033203125, -12.3564453125, -10.62255859375, -8.888671875, -7.15478515625, -5.4208984375, -3.68701171875, -1.953125, -0.21923828125, 1.5146484375, 3.24853515625, 4.982421875, 6.71630859375, 8.4501953125, 10.18408203125, 11.91796875, 13.65185546875, 15.3857421875, 17.11962890625, 18.853515625, 20.58740234375, 22.3212890625, 24.05517578125, 25.7890625, 27.52294921875, 29.2568359375, 30.99072265625, 32.724609375, 34.45849609375, 36.1923828125, 37.92626953125, 39.66015625, 41.39404296875, 43.1279296875, 44.86181640625, 46.595703125, 48.32958984375, 50.0634765625, 51.79736328125, 53.53125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 1.0, 6.0, 9.0, 23.0, 20.0, 39.0, 46.0, 88.0, 246.0, 1828.0, 106146.0, 934513.0, 4845.0, 421.0, 120.0, 73.0, 43.0, 27.0, 26.0, 13.0, 1.0, 4.0, 4.0, 6.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.828125, -30.86865234375, -29.9091796875, -28.94970703125, -27.990234375, -27.03076171875, -26.0712890625, -25.11181640625, -24.15234375, -23.19287109375, -22.2333984375, -21.27392578125, -20.314453125, -19.35498046875, -18.3955078125, -17.43603515625, -16.4765625, -15.51708984375, -14.5576171875, -13.59814453125, -12.638671875, -11.67919921875, -10.7197265625, -9.76025390625, -8.80078125, -7.84130859375, -6.8818359375, -5.92236328125, -4.962890625, -4.00341796875, -3.0439453125, -2.08447265625, -1.125, -0.16552734375, 0.7939453125, 1.75341796875, 2.712890625, 3.67236328125, 4.6318359375, 5.59130859375, 6.55078125, 7.51025390625, 8.4697265625, 9.42919921875, 10.388671875, 11.34814453125, 12.3076171875, 13.26708984375, 14.2265625, 15.18603515625, 16.1455078125, 17.10498046875, 18.064453125, 19.02392578125, 19.9833984375, 20.94287109375, 21.90234375, 22.86181640625, 23.8212890625, 24.78076171875, 25.740234375, 26.69970703125, 27.6591796875, 28.61865234375, 29.578125]}, "gradients/decoder.model.decoder.layers.10.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 5.0, 13.0, 10.0, 17.0, 21.0, 37.0, 64.0, 97.0, 142.0, 176.0, 145.0, 91.0, 60.0, 44.0, 25.0, 14.0, 11.0, 8.0, 5.0, 3.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0014886856079101562, -0.00144118070602417, -0.0013936758041381836, -0.0013461709022521973, -0.001298666000366211, -0.0012511610984802246, -0.0012036561965942383, -0.001156151294708252, -0.0011086463928222656, -0.0010611414909362793, -0.001013636589050293, -0.0009661316871643066, -0.0009186267852783203, -0.000871121883392334, -0.0008236169815063477, -0.0007761120796203613, -0.000728607177734375, -0.0006811022758483887, -0.0006335973739624023, -0.000586092472076416, -0.0005385875701904297, -0.0004910826683044434, -0.00044357776641845703, -0.0003960728645324707, -0.0003485679626464844, -0.00030106306076049805, -0.0002535581588745117, -0.0002060532569885254, -0.00015854835510253906, -0.00011104345321655273, -6.35385513305664e-05, -1.6033649444580078e-05, 3.147125244140625e-05, 7.897615432739258e-05, 0.0001264810562133789, 0.00017398595809936523, 0.00022149085998535156, 0.0002689957618713379, 0.0003165006637573242, 0.00036400556564331055, 0.0004115104675292969, 0.0004590153694152832, 0.0005065202713012695, 0.0005540251731872559, 0.0006015300750732422, 0.0006490349769592285, 0.0006965398788452148, 0.0007440447807312012, 0.0007915496826171875, 0.0008390545845031738, 0.0008865594863891602, 0.0009340643882751465, 0.0009815692901611328, 0.0010290741920471191, 0.0010765790939331055, 0.0011240839958190918, 0.0011715888977050781, 0.0012190937995910645, 0.0012665987014770508, 0.0013141036033630371, 0.0013616085052490234, 0.0014091134071350098, 0.001456618309020996, 0.0015041232109069824, 0.0015516281127929688]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 5.0, 6.0, 12.0, 7.0, 14.0, 14.0, 37.0, 39.0, 73.0, 137.0, 500.0, 5672.0, 772546.0, 266017.0, 2827.0, 313.0, 107.0, 81.0, 36.0, 24.0, 24.0, 7.0, 13.0, 13.0, 1.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.1875, -19.48876953125, -18.7900390625, -18.09130859375, -17.392578125, -16.69384765625, -15.9951171875, -15.29638671875, -14.59765625, -13.89892578125, -13.2001953125, -12.50146484375, -11.802734375, -11.10400390625, -10.4052734375, -9.70654296875, -9.0078125, -8.30908203125, -7.6103515625, -6.91162109375, -6.212890625, -5.51416015625, -4.8154296875, -4.11669921875, -3.41796875, -2.71923828125, -2.0205078125, -1.32177734375, -0.623046875, 0.07568359375, 0.7744140625, 1.47314453125, 2.171875, 2.87060546875, 3.5693359375, 4.26806640625, 4.966796875, 5.66552734375, 6.3642578125, 7.06298828125, 7.76171875, 8.46044921875, 9.1591796875, 9.85791015625, 10.556640625, 11.25537109375, 11.9541015625, 12.65283203125, 13.3515625, 14.05029296875, 14.7490234375, 15.44775390625, 16.146484375, 16.84521484375, 17.5439453125, 18.24267578125, 18.94140625, 19.64013671875, 20.3388671875, 21.03759765625, 21.736328125, 22.43505859375, 23.1337890625, 23.83251953125, 24.53125]}, "gradients/decoder.model.decoder.layers.10.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 6.0, 4.0, 8.0, 12.0, 18.0, 18.0, 27.0, 36.0, 41.0, 49.0, 65.0, 73.0, 81.0, 88.0, 100.0, 88.0, 66.0, 49.0, 32.0, 24.0, 32.0, 13.0, 29.0, 12.0, 12.0, 4.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.939453125, -2.852325439453125, -2.76519775390625, -2.678070068359375, -2.5909423828125, -2.503814697265625, -2.41668701171875, -2.329559326171875, -2.242431640625, -2.155303955078125, -2.06817626953125, -1.981048583984375, -1.8939208984375, -1.806793212890625, -1.71966552734375, -1.632537841796875, -1.54541015625, -1.458282470703125, -1.37115478515625, -1.284027099609375, -1.1968994140625, -1.109771728515625, -1.02264404296875, -0.935516357421875, -0.848388671875, -0.761260986328125, -0.67413330078125, -0.587005615234375, -0.4998779296875, -0.412750244140625, -0.32562255859375, -0.238494873046875, -0.1513671875, -0.064239501953125, 0.02288818359375, 0.110015869140625, 0.1971435546875, 0.284271240234375, 0.37139892578125, 0.458526611328125, 0.545654296875, 0.632781982421875, 0.71990966796875, 0.807037353515625, 0.8941650390625, 0.981292724609375, 1.06842041015625, 1.155548095703125, 1.24267578125, 1.329803466796875, 1.41693115234375, 1.504058837890625, 1.5911865234375, 1.678314208984375, 1.76544189453125, 1.852569580078125, 1.939697265625, 2.026824951171875, 2.11395263671875, 2.201080322265625, 2.2882080078125, 2.375335693359375, 2.46246337890625, 2.549591064453125, 2.63671875]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 19.0, 237.0, 590.0, 143.0, 18.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-411.79559326171875, -404.2203674316406, -396.6451416015625, -389.0699462890625, -381.4947204589844, -373.91949462890625, -366.3442687988281, -358.76904296875, -351.19384765625, -343.6186218261719, -336.04339599609375, -328.46820068359375, -320.8929748535156, -313.3177490234375, -305.7425231933594, -298.16729736328125, -290.5920715332031, -283.016845703125, -275.4416198730469, -267.8664245605469, -260.29119873046875, -252.71597290039062, -245.1407470703125, -237.56553649902344, -229.99032592773438, -222.41510009765625, -214.8398895263672, -207.26466369628906, -199.689453125, -192.11422729492188, -184.53900146484375, -176.9637908935547, -169.38858032226562, -161.8133544921875, -154.23814392089844, -146.6629180908203, -139.08770751953125, -131.51248168945312, -123.93726348876953, -116.36204528808594, -108.78681945800781, -101.21160125732422, -93.63638305664062, -86.0611572265625, -78.4859390258789, -70.91072082519531, -63.33550262451172, -55.76028060913086, -48.18505859375, -40.609840393066406, -33.03461837768555, -25.459400177001953, -17.884180068969727, -10.3089599609375, -2.7337417602539062, 4.841480255126953, 12.416698455810547, 19.991918563842773, 27.567138671875, 35.142356872558594, 42.71757507324219, 50.29279708862305, 57.86801528930664, 65.4432373046875, 73.0184555053711]}, "gradients/decoder.model.decoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 7.0, 5.0, 6.0, 18.0, 16.0, 13.0, 15.0, 21.0, 29.0, 30.0, 47.0, 51.0, 37.0, 46.0, 63.0, 50.0, 60.0, 57.0, 60.0, 63.0, 52.0, 45.0, 37.0, 35.0, 27.0, 19.0, 13.0, 22.0, 16.0, 10.0, 10.0, 7.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-63.365135192871094, -61.59109115600586, -59.817047119140625, -58.042999267578125, -56.26895523071289, -54.494911193847656, -52.72086715698242, -50.94682312011719, -49.17277526855469, -47.39873123168945, -45.62468719482422, -43.85063934326172, -42.076595306396484, -40.30255126953125, -38.528507232666016, -36.75446319580078, -34.98041915893555, -33.20637512207031, -31.432329177856445, -29.65828514099121, -27.884239196777344, -26.11019515991211, -24.336151123046875, -22.56210708618164, -20.788061141967773, -19.01401710510254, -17.239971160888672, -15.465927124023438, -13.691882133483887, -11.917837142944336, -10.143793106079102, -8.36974811553955, -6.595703125, -4.821658134460449, -3.0476136207580566, -1.273569107055664, 0.5004758834838867, 2.2745208740234375, 4.048564910888672, 5.822609901428223, 7.596654891967773, 9.370699882507324, 11.144744873046875, 12.91878890991211, 14.69283390045166, 16.46687889099121, 18.240922927856445, 20.014968872070312, 21.789012908935547, 23.56305694580078, 25.33710289001465, 27.111146926879883, 28.88519287109375, 30.659236907958984, 32.43328094482422, 34.20732498168945, 35.98136901855469, 37.75541305541992, 39.529457092285156, 41.303504943847656, 43.07754898071289, 44.851593017578125, 46.62563705444336, 48.399681091308594, 50.173728942871094]}, "gradients/decoder.model.decoder.layers.9.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 3.0, 12.0, 9.0, 4.0, 15.0, 13.0, 19.0, 28.0, 33.0, 39.0, 45.0, 69.0, 95.0, 131.0, 275.0, 514.0, 1374.0, 6076.0, 47434.0, 588243.0, 2708947.0, 765245.0, 61313.0, 8500.0, 1907.0, 914.0, 751.0, 661.0, 638.0, 455.0, 266.0, 122.0, 44.0, 18.0, 17.0, 9.0, 5.0, 4.0, 6.0, 3.0, 3.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-34.21875, -33.198974609375, -32.17919921875, -31.159423828125, -30.1396484375, -29.119873046875, -28.10009765625, -27.080322265625, -26.060546875, -25.040771484375, -24.02099609375, -23.001220703125, -21.9814453125, -20.961669921875, -19.94189453125, -18.922119140625, -17.90234375, -16.882568359375, -15.86279296875, -14.843017578125, -13.8232421875, -12.803466796875, -11.78369140625, -10.763916015625, -9.744140625, -8.724365234375, -7.70458984375, -6.684814453125, -5.6650390625, -4.645263671875, -3.62548828125, -2.605712890625, -1.5859375, -0.566162109375, 0.45361328125, 1.473388671875, 2.4931640625, 3.512939453125, 4.53271484375, 5.552490234375, 6.572265625, 7.592041015625, 8.61181640625, 9.631591796875, 10.6513671875, 11.671142578125, 12.69091796875, 13.710693359375, 14.73046875, 15.750244140625, 16.77001953125, 17.789794921875, 18.8095703125, 19.829345703125, 20.84912109375, 21.868896484375, 22.888671875, 23.908447265625, 24.92822265625, 25.947998046875, 26.9677734375, 27.987548828125, 29.00732421875, 30.027099609375, 31.046875]}, "gradients/decoder.model.decoder.layers.9.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 8.0, 12.0, 27.0, 38.0, 66.0, 96.0, 127.0, 158.0, 132.0, 131.0, 99.0, 50.0, 31.0, 15.0, 11.0, 6.0, 4.0, 0.0, 3.0], "bins": [-89.75, -88.0498046875, -86.349609375, -84.6494140625, -82.94921875, -81.2490234375, -79.548828125, -77.8486328125, -76.1484375, -74.4482421875, -72.748046875, -71.0478515625, -69.34765625, -67.6474609375, -65.947265625, -64.2470703125, -62.546875, -60.8466796875, -59.146484375, -57.4462890625, -55.74609375, -54.0458984375, -52.345703125, -50.6455078125, -48.9453125, -47.2451171875, -45.544921875, -43.8447265625, -42.14453125, -40.4443359375, -38.744140625, -37.0439453125, -35.34375, -33.6435546875, -31.943359375, -30.2431640625, -28.54296875, -26.8427734375, -25.142578125, -23.4423828125, -21.7421875, -20.0419921875, -18.341796875, -16.6416015625, -14.94140625, -13.2412109375, -11.541015625, -9.8408203125, -8.140625, -6.4404296875, -4.740234375, -3.0400390625, -1.33984375, 0.3603515625, 2.060546875, 3.7607421875, 5.4609375, 7.1611328125, 8.861328125, 10.5615234375, 12.26171875, 13.9619140625, 15.662109375, 17.3623046875, 19.0625]}, "gradients/decoder.model.decoder.layers.9.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 6.0, 7.0, 9.0, 10.0, 12.0, 28.0, 40.0, 62.0, 167.0, 345.0, 1285.0, 27180.0, 4133214.0, 29927.0, 1260.0, 363.0, 168.0, 75.0, 48.0, 20.0, 13.0, 8.0, 7.0, 5.0, 1.0, 5.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-114.375, -111.060546875, -107.74609375, -104.431640625, -101.1171875, -97.802734375, -94.48828125, -91.173828125, -87.859375, -84.544921875, -81.23046875, -77.916015625, -74.6015625, -71.287109375, -67.97265625, -64.658203125, -61.34375, -58.029296875, -54.71484375, -51.400390625, -48.0859375, -44.771484375, -41.45703125, -38.142578125, -34.828125, -31.513671875, -28.19921875, -24.884765625, -21.5703125, -18.255859375, -14.94140625, -11.626953125, -8.3125, -4.998046875, -1.68359375, 1.630859375, 4.9453125, 8.259765625, 11.57421875, 14.888671875, 18.203125, 21.517578125, 24.83203125, 28.146484375, 31.4609375, 34.775390625, 38.08984375, 41.404296875, 44.71875, 48.033203125, 51.34765625, 54.662109375, 57.9765625, 61.291015625, 64.60546875, 67.919921875, 71.234375, 74.548828125, 77.86328125, 81.177734375, 84.4921875, 87.806640625, 91.12109375, 94.435546875, 97.75]}, "gradients/decoder.model.decoder.layers.9.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 7.0, 19.0, 23.0, 29.0, 34.0, 76.0, 109.0, 172.0, 336.0, 545.0, 802.0, 746.0, 495.0, 254.0, 175.0, 89.0, 45.0, 35.0, 27.0, 19.0, 6.0, 7.0, 7.0, 3.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.09375, -11.687744140625, -11.28173828125, -10.875732421875, -10.4697265625, -10.063720703125, -9.65771484375, -9.251708984375, -8.845703125, -8.439697265625, -8.03369140625, -7.627685546875, -7.2216796875, -6.815673828125, -6.40966796875, -6.003662109375, -5.59765625, -5.191650390625, -4.78564453125, -4.379638671875, -3.9736328125, -3.567626953125, -3.16162109375, -2.755615234375, -2.349609375, -1.943603515625, -1.53759765625, -1.131591796875, -0.7255859375, -0.319580078125, 0.08642578125, 0.492431640625, 0.8984375, 1.304443359375, 1.71044921875, 2.116455078125, 2.5224609375, 2.928466796875, 3.33447265625, 3.740478515625, 4.146484375, 4.552490234375, 4.95849609375, 5.364501953125, 5.7705078125, 6.176513671875, 6.58251953125, 6.988525390625, 7.39453125, 7.800537109375, 8.20654296875, 8.612548828125, 9.0185546875, 9.424560546875, 9.83056640625, 10.236572265625, 10.642578125, 11.048583984375, 11.45458984375, 11.860595703125, 12.2666015625, 12.672607421875, 13.07861328125, 13.484619140625, 13.890625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 11.0, 27.0, 56.0, 85.0, 147.0, 163.0, 182.0, 147.0, 92.0, 46.0, 20.0, 12.0, 7.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-89.4969482421875, -87.77714538574219, -86.05733489990234, -84.33753204345703, -82.61772155761719, -80.89791870117188, -79.17811584472656, -77.45830535888672, -75.7385025024414, -74.0186996459961, -72.29888916015625, -70.57908630371094, -68.8592758178711, -67.13947296142578, -65.41967010498047, -63.699859619140625, -61.98005676269531, -60.260250091552734, -58.540443420410156, -56.820640563964844, -55.100833892822266, -53.38102722167969, -51.66122055053711, -49.94141387939453, -48.22160720825195, -46.501800537109375, -44.7819938659668, -43.062191009521484, -41.342384338378906, -39.62257766723633, -37.90277099609375, -36.18296813964844, -34.46316146850586, -32.74335479736328, -31.023550033569336, -29.303743362426758, -27.583938598632812, -25.864131927490234, -24.144325256347656, -22.42452049255371, -20.704715728759766, -18.984909057617188, -17.265104293823242, -15.545297622680664, -13.825492858886719, -12.10568618774414, -10.385880470275879, -8.666074752807617, -6.946268081665039, -5.226462364196777, -3.5066564083099365, -1.7868504524230957, -0.06704473495483398, 1.652761459350586, 3.3725671768188477, 5.092372894287109, 6.812178611755371, 8.531984329223633, 10.251790046691895, 11.971595764160156, 13.691402435302734, 15.411208152770996, 17.131013870239258, 18.850818634033203, 20.57062530517578]}, "gradients/decoder.model.decoder.layers.9.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 4.0, 17.0, 15.0, 20.0, 30.0, 38.0, 74.0, 58.0, 86.0, 95.0, 105.0, 94.0, 86.0, 86.0, 65.0, 51.0, 32.0, 23.0, 14.0, 5.0, 8.0, 2.0, 1.0, 1.0, 0.0, 3.0], "bins": [-64.17044067382812, -62.849178314208984, -61.52791213989258, -60.20664978027344, -58.8853874206543, -57.56412124633789, -56.24285888671875, -54.921592712402344, -53.6003303527832, -52.27906799316406, -50.957801818847656, -49.636539459228516, -48.315277099609375, -46.99401092529297, -45.67274856567383, -44.35148620605469, -43.03022003173828, -41.70895767211914, -40.387691497802734, -39.066429138183594, -37.74516677856445, -36.42390060424805, -35.102638244628906, -33.7813720703125, -32.460113525390625, -31.13884925842285, -29.81758689880371, -28.496322631835938, -27.175058364868164, -25.85379409790039, -24.53253173828125, -23.211267471313477, -21.890005111694336, -20.568740844726562, -19.247478485107422, -17.92621421813965, -16.604949951171875, -15.283686637878418, -13.962423324584961, -12.641159057617188, -11.31989574432373, -9.998632431030273, -8.6773681640625, -7.356104850769043, -6.034841060638428, -4.7135772705078125, -3.3923139572143555, -2.071049690246582, -0.749786376953125, 0.5714772939682007, 1.8927409648895264, 3.2140045166015625, 4.535268306732178, 5.856532096862793, 7.17779541015625, 8.499059677124023, 9.82032299041748, 11.141586303710938, 12.462850570678711, 13.784113883972168, 15.105377197265625, 16.4266414642334, 17.747905731201172, 19.069168090820312, 20.390432357788086]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 3.0, 9.0, 11.0, 17.0, 42.0, 87.0, 199.0, 673.0, 2848.0, 31051.0, 936437.0, 71824.0, 3979.0, 871.0, 277.0, 99.0, 54.0, 32.0, 11.0, 6.0, 4.0, 1.0, 1.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.859375, -12.314453125, -11.76953125, -11.224609375, -10.6796875, -10.134765625, -9.58984375, -9.044921875, -8.5, -7.955078125, -7.41015625, -6.865234375, -6.3203125, -5.775390625, -5.23046875, -4.685546875, -4.140625, -3.595703125, -3.05078125, -2.505859375, -1.9609375, -1.416015625, -0.87109375, -0.326171875, 0.21875, 0.763671875, 1.30859375, 1.853515625, 2.3984375, 2.943359375, 3.48828125, 4.033203125, 4.578125, 5.123046875, 5.66796875, 6.212890625, 6.7578125, 7.302734375, 7.84765625, 8.392578125, 8.9375, 9.482421875, 10.02734375, 10.572265625, 11.1171875, 11.662109375, 12.20703125, 12.751953125, 13.296875, 13.841796875, 14.38671875, 14.931640625, 15.4765625, 16.021484375, 16.56640625, 17.111328125, 17.65625, 18.201171875, 18.74609375, 19.291015625, 19.8359375, 20.380859375, 20.92578125, 21.470703125, 22.015625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 12.0, 15.0, 26.0, 49.0, 67.0, 98.0, 116.0, 127.0, 145.0, 114.0, 99.0, 63.0, 38.0, 19.0, 12.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-52.5625, -51.43896484375, -50.3154296875, -49.19189453125, -48.068359375, -46.94482421875, -45.8212890625, -44.69775390625, -43.57421875, -42.45068359375, -41.3271484375, -40.20361328125, -39.080078125, -37.95654296875, -36.8330078125, -35.70947265625, -34.5859375, -33.46240234375, -32.3388671875, -31.21533203125, -30.091796875, -28.96826171875, -27.8447265625, -26.72119140625, -25.59765625, -24.47412109375, -23.3505859375, -22.22705078125, -21.103515625, -19.97998046875, -18.8564453125, -17.73291015625, -16.609375, -15.48583984375, -14.3623046875, -13.23876953125, -12.115234375, -10.99169921875, -9.8681640625, -8.74462890625, -7.62109375, -6.49755859375, -5.3740234375, -4.25048828125, -3.126953125, -2.00341796875, -0.8798828125, 0.24365234375, 1.3671875, 2.49072265625, 3.6142578125, 4.73779296875, 5.861328125, 6.98486328125, 8.1083984375, 9.23193359375, 10.35546875, 11.47900390625, 12.6025390625, 13.72607421875, 14.849609375, 15.97314453125, 17.0966796875, 18.22021484375, 19.34375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 5.0, 6.0, 5.0, 9.0, 20.0, 36.0, 41.0, 66.0, 114.0, 202.0, 351.0, 552.0, 1127.0, 2105.0, 4193.0, 8861.0, 19275.0, 46618.0, 116535.0, 258468.0, 306335.0, 166195.0, 66872.0, 27292.0, 11866.0, 5580.0, 2579.0, 1442.0, 804.0, 421.0, 242.0, 136.0, 67.0, 59.0, 33.0, 19.0, 15.0, 3.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.767578125, -1.694549560546875, -1.62152099609375, -1.548492431640625, -1.4754638671875, -1.402435302734375, -1.32940673828125, -1.256378173828125, -1.183349609375, -1.110321044921875, -1.03729248046875, -0.964263916015625, -0.8912353515625, -0.818206787109375, -0.74517822265625, -0.672149658203125, -0.59912109375, -0.526092529296875, -0.45306396484375, -0.380035400390625, -0.3070068359375, -0.233978271484375, -0.16094970703125, -0.087921142578125, -0.014892578125, 0.058135986328125, 0.13116455078125, 0.204193115234375, 0.2772216796875, 0.350250244140625, 0.42327880859375, 0.496307373046875, 0.5693359375, 0.642364501953125, 0.71539306640625, 0.788421630859375, 0.8614501953125, 0.934478759765625, 1.00750732421875, 1.080535888671875, 1.153564453125, 1.226593017578125, 1.29962158203125, 1.372650146484375, 1.4456787109375, 1.518707275390625, 1.59173583984375, 1.664764404296875, 1.73779296875, 1.810821533203125, 1.88385009765625, 1.956878662109375, 2.0299072265625, 2.102935791015625, 2.17596435546875, 2.248992919921875, 2.322021484375, 2.395050048828125, 2.46807861328125, 2.541107177734375, 2.6141357421875, 2.687164306640625, 2.76019287109375, 2.833221435546875, 2.90625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 11.0, 8.0, 13.0, 11.0, 14.0, 17.0, 29.0, 26.0, 37.0, 36.0, 43.0, 50.0, 47.0, 62.0, 58.0, 59.0, 51.0, 35.0, 54.0, 43.0, 37.0, 41.0, 32.0, 29.0, 30.0, 20.0, 24.0, 24.0, 13.0, 10.0, 6.0, 7.0, 6.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.875, -23.92138671875, -22.9677734375, -22.01416015625, -21.060546875, -20.10693359375, -19.1533203125, -18.19970703125, -17.24609375, -16.29248046875, -15.3388671875, -14.38525390625, -13.431640625, -12.47802734375, -11.5244140625, -10.57080078125, -9.6171875, -8.66357421875, -7.7099609375, -6.75634765625, -5.802734375, -4.84912109375, -3.8955078125, -2.94189453125, -1.98828125, -1.03466796875, -0.0810546875, 0.87255859375, 1.826171875, 2.77978515625, 3.7333984375, 4.68701171875, 5.640625, 6.59423828125, 7.5478515625, 8.50146484375, 9.455078125, 10.40869140625, 11.3623046875, 12.31591796875, 13.26953125, 14.22314453125, 15.1767578125, 16.13037109375, 17.083984375, 18.03759765625, 18.9912109375, 19.94482421875, 20.8984375, 21.85205078125, 22.8056640625, 23.75927734375, 24.712890625, 25.66650390625, 26.6201171875, 27.57373046875, 28.52734375, 29.48095703125, 30.4345703125, 31.38818359375, 32.341796875, 33.29541015625, 34.2490234375, 35.20263671875, 36.15625]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 8.0, 13.0, 10.0, 13.0, 25.0, 41.0, 51.0, 90.0, 136.0, 253.0, 384.0, 955.0, 2077.0, 6017.0, 22378.0, 119862.0, 562783.0, 273914.0, 43565.0, 10139.0, 3202.0, 1229.0, 593.0, 309.0, 183.0, 106.0, 68.0, 60.0, 25.0, 12.0, 20.0, 9.0, 10.0, 8.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55517578125, -0.5382080078125, -0.521240234375, -0.5042724609375, -0.4873046875, -0.4703369140625, -0.453369140625, -0.4364013671875, -0.41943359375, -0.4024658203125, -0.385498046875, -0.3685302734375, -0.3515625, -0.3345947265625, -0.317626953125, -0.3006591796875, -0.28369140625, -0.2667236328125, -0.249755859375, -0.2327880859375, -0.2158203125, -0.1988525390625, -0.181884765625, -0.1649169921875, -0.14794921875, -0.1309814453125, -0.114013671875, -0.0970458984375, -0.080078125, -0.0631103515625, -0.046142578125, -0.0291748046875, -0.01220703125, 0.0047607421875, 0.021728515625, 0.0386962890625, 0.0556640625, 0.0726318359375, 0.089599609375, 0.1065673828125, 0.12353515625, 0.1405029296875, 0.157470703125, 0.1744384765625, 0.19140625, 0.2083740234375, 0.225341796875, 0.2423095703125, 0.25927734375, 0.2762451171875, 0.293212890625, 0.3101806640625, 0.3271484375, 0.3441162109375, 0.361083984375, 0.3780517578125, 0.39501953125, 0.4119873046875, 0.428955078125, 0.4459228515625, 0.462890625, 0.4798583984375, 0.496826171875, 0.5137939453125, 0.53076171875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 17.0, 15.0, 26.0, 31.0, 27.0, 41.0, 58.0, 58.0, 79.0, 94.0, 91.0, 97.0, 65.0, 56.0, 61.0, 42.0, 32.0, 16.0, 14.0, 9.0, 9.0, 6.0, 3.0, 11.0, 9.0, 2.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001900196075439453, -0.00018301233649253845, -0.0001760050654411316, -0.00016899779438972473, -0.00016199052333831787, -0.000154983252286911, -0.00014797598123550415, -0.0001409687101840973, -0.00013396143913269043, -0.00012695416808128357, -0.00011994689702987671, -0.00011293962597846985, -0.00010593235492706299, -9.892508387565613e-05, -9.191781282424927e-05, -8.491054177284241e-05, -7.790327072143555e-05, -7.089599967002869e-05, -6.388872861862183e-05, -5.6881457567214966e-05, -4.9874186515808105e-05, -4.2866915464401245e-05, -3.5859644412994385e-05, -2.8852373361587524e-05, -2.1845102310180664e-05, -1.4837831258773804e-05, -7.830560207366943e-06, -8.23289155960083e-07, 6.183981895446777e-06, 1.3191252946853638e-05, 2.0198523998260498e-05, 2.720579504966736e-05, 3.421306610107422e-05, 4.122033715248108e-05, 4.822760820388794e-05, 5.52348792552948e-05, 6.224215030670166e-05, 6.924942135810852e-05, 7.625669240951538e-05, 8.326396346092224e-05, 9.02712345123291e-05, 9.727850556373596e-05, 0.00010428577661514282, 0.00011129304766654968, 0.00011830031871795654, 0.0001253075897693634, 0.00013231486082077026, 0.00013932213187217712, 0.00014632940292358398, 0.00015333667397499084, 0.0001603439450263977, 0.00016735121607780457, 0.00017435848712921143, 0.00018136575818061829, 0.00018837302923202515, 0.000195380300283432, 0.00020238757133483887, 0.00020939484238624573, 0.0002164021134376526, 0.00022340938448905945, 0.0002304166555404663, 0.00023742392659187317, 0.00024443119764328003, 0.0002514384686946869, 0.00025844573974609375]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 5.0, 0.0, 11.0, 5.0, 7.0, 6.0, 18.0, 17.0, 33.0, 41.0, 65.0, 120.0, 198.0, 382.0, 883.0, 2047.0, 5849.0, 23862.0, 203318.0, 697345.0, 92893.0, 14364.0, 4129.0, 1509.0, 669.0, 317.0, 153.0, 93.0, 57.0, 40.0, 30.0, 20.0, 11.0, 11.0, 11.0, 8.0, 8.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.68505859375, -0.6632003784179688, -0.6413421630859375, -0.6194839477539062, -0.597625732421875, -0.5757675170898438, -0.5539093017578125, -0.5320510864257812, -0.51019287109375, -0.48833465576171875, -0.4664764404296875, -0.44461822509765625, -0.422760009765625, -0.40090179443359375, -0.3790435791015625, -0.35718536376953125, -0.3353271484375, -0.31346893310546875, -0.2916107177734375, -0.26975250244140625, -0.247894287109375, -0.22603607177734375, -0.2041778564453125, -0.18231964111328125, -0.16046142578125, -0.13860321044921875, -0.1167449951171875, -0.09488677978515625, -0.073028564453125, -0.05117034912109375, -0.0293121337890625, -0.00745391845703125, 0.014404296875, 0.03626251220703125, 0.0581207275390625, 0.07997894287109375, 0.101837158203125, 0.12369537353515625, 0.1455535888671875, 0.16741180419921875, 0.18927001953125, 0.21112823486328125, 0.2329864501953125, 0.25484466552734375, 0.276702880859375, 0.29856109619140625, 0.3204193115234375, 0.34227752685546875, 0.3641357421875, 0.38599395751953125, 0.4078521728515625, 0.42971038818359375, 0.451568603515625, 0.47342681884765625, 0.4952850341796875, 0.5171432495117188, 0.53900146484375, 0.5608596801757812, 0.5827178955078125, 0.6045761108398438, 0.626434326171875, 0.6482925415039062, 0.6701507568359375, 0.6920089721679688, 0.7138671875]}, "gradients/decoder.model.decoder.layers.9.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 8.0, 8.0, 11.0, 25.0, 45.0, 75.0, 104.0, 145.0, 151.0, 151.0, 100.0, 61.0, 44.0, 19.0, 9.0, 10.0, 3.0, 6.0, 0.0, 3.0, 0.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.2410888671875, -0.2338542938232422, -0.22661972045898438, -0.21938514709472656, -0.21215057373046875, -0.20491600036621094, -0.19768142700195312, -0.1904468536376953, -0.1832122802734375, -0.1759777069091797, -0.16874313354492188, -0.16150856018066406, -0.15427398681640625, -0.14703941345214844, -0.13980484008789062, -0.1325702667236328, -0.125335693359375, -0.11810111999511719, -0.11086654663085938, -0.10363197326660156, -0.09639739990234375, -0.08916282653808594, -0.08192825317382812, -0.07469367980957031, -0.0674591064453125, -0.06022453308105469, -0.052989959716796875, -0.04575538635253906, -0.03852081298828125, -0.03128623962402344, -0.024051666259765625, -0.016817092895507812, -0.00958251953125, -0.0023479461669921875, 0.004886627197265625, 0.012121200561523438, 0.01935577392578125, 0.026590347290039062, 0.033824920654296875, 0.04105949401855469, 0.0482940673828125, 0.05552864074707031, 0.06276321411132812, 0.06999778747558594, 0.07723236083984375, 0.08446693420410156, 0.09170150756835938, 0.09893608093261719, 0.106170654296875, 0.11340522766113281, 0.12063980102539062, 0.12787437438964844, 0.13510894775390625, 0.14234352111816406, 0.14957809448242188, 0.1568126678466797, 0.1640472412109375, 0.1712818145751953, 0.17851638793945312, 0.18575096130371094, 0.19298553466796875, 0.20022010803222656, 0.20745468139648438, 0.2146892547607422, 0.221923828125]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 22.0, 30.0, 57.0, 114.0, 143.0, 181.0, 180.0, 124.0, 67.0, 43.0, 15.0, 8.0, 3.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.88543701171875, -46.897682189941406, -45.9099235534668, -44.92216873168945, -43.934410095214844, -42.9466552734375, -41.958900451660156, -40.97114181518555, -39.9833869934082, -38.99563217163086, -38.00787353515625, -37.020118713378906, -36.0323600769043, -35.04460525512695, -34.056846618652344, -33.069091796875, -32.081336975097656, -31.09358024597168, -30.105823516845703, -29.11806869506836, -28.130311965942383, -27.142555236816406, -26.15479850769043, -25.167041778564453, -24.179283142089844, -23.191526412963867, -22.20376968383789, -21.216014862060547, -20.22825813293457, -19.240501403808594, -18.252744674682617, -17.26498794555664, -16.277233123779297, -15.28947639465332, -14.30172061920166, -13.313963890075684, -12.326208114624023, -11.338451385498047, -10.35069465637207, -9.362937927246094, -8.375181198120117, -7.387424945831299, -6.3996686935424805, -5.411911964416504, -4.4241557121276855, -3.436399459838867, -2.4486427307128906, -1.4608864784240723, -0.4731302261352539, 0.514626145362854, 1.502382516860962, 2.4901390075683594, 3.4778952598571777, 4.465651512145996, 5.453408241271973, 6.441164493560791, 7.428920745849609, 8.416677474975586, 9.404433250427246, 10.392189979553223, 11.379945755004883, 12.36770248413086, 13.355459213256836, 14.343215942382812, 15.330971717834473]}, "gradients/decoder.model.decoder.layers.9.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 13.0, 20.0, 20.0, 45.0, 70.0, 95.0, 115.0, 136.0, 128.0, 118.0, 95.0, 74.0, 37.0, 22.0, 7.0, 4.0, 7.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-51.77899932861328, -50.717899322509766, -49.656795501708984, -48.59569549560547, -47.53459167480469, -46.47349166870117, -45.41238784790039, -44.351287841796875, -43.290184020996094, -42.22908401489258, -41.1679801940918, -40.10688018798828, -39.0457763671875, -37.984676361083984, -36.9235725402832, -35.86247253417969, -34.801368713378906, -33.74026870727539, -32.67916488647461, -31.61806297302246, -30.556961059570312, -29.495859146118164, -28.434757232666016, -27.3736572265625, -26.312557220458984, -25.251455307006836, -24.190353393554688, -23.12925148010254, -22.06814956665039, -21.007047653198242, -19.945945739746094, -18.884845733642578, -17.823740005493164, -16.762638092041016, -15.701536178588867, -14.640434265136719, -13.57933235168457, -12.518230438232422, -11.45712947845459, -10.396027565002441, -9.334925651550293, -8.273823738098145, -7.212721824645996, -6.151620388031006, -5.090518474578857, -4.029416561126709, -2.9683151245117188, -1.9072132110595703, -0.8461112976074219, 0.214990496635437, 1.276092290878296, 2.3371939659118652, 3.3982958793640137, 4.459397792816162, 5.520499229431152, 6.581601142883301, 7.642703056335449, 8.703804969787598, 9.764906883239746, 10.826007843017578, 11.887109756469727, 12.948211669921875, 14.009313583374023, 15.070415496826172, 16.13151741027832]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 8.0, 10.0, 16.0, 19.0, 56.0, 81.0, 254.0, 759.0, 3626.0, 26283.0, 341991.0, 619175.0, 48647.0, 5858.0, 1174.0, 330.0, 126.0, 52.0, 32.0, 18.0, 10.0, 7.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.0625, -23.236572265625, -22.41064453125, -21.584716796875, -20.7587890625, -19.932861328125, -19.10693359375, -18.281005859375, -17.455078125, -16.629150390625, -15.80322265625, -14.977294921875, -14.1513671875, -13.325439453125, -12.49951171875, -11.673583984375, -10.84765625, -10.021728515625, -9.19580078125, -8.369873046875, -7.5439453125, -6.718017578125, -5.89208984375, -5.066162109375, -4.240234375, -3.414306640625, -2.58837890625, -1.762451171875, -0.9365234375, -0.110595703125, 0.71533203125, 1.541259765625, 2.3671875, 3.193115234375, 4.01904296875, 4.844970703125, 5.6708984375, 6.496826171875, 7.32275390625, 8.148681640625, 8.974609375, 9.800537109375, 10.62646484375, 11.452392578125, 12.2783203125, 13.104248046875, 13.93017578125, 14.756103515625, 15.58203125, 16.407958984375, 17.23388671875, 18.059814453125, 18.8857421875, 19.711669921875, 20.53759765625, 21.363525390625, 22.189453125, 23.015380859375, 23.84130859375, 24.667236328125, 25.4931640625, 26.319091796875, 27.14501953125, 27.970947265625, 28.796875]}, "gradients/decoder.model.decoder.layers.9.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 11.0, 19.0, 22.0, 28.0, 46.0, 65.0, 83.0, 102.0, 122.0, 130.0, 102.0, 82.0, 70.0, 59.0, 28.0, 17.0, 9.0, 6.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-87.75, -85.988037109375, -84.22607421875, -82.464111328125, -80.7021484375, -78.940185546875, -77.17822265625, -75.416259765625, -73.654296875, -71.892333984375, -70.13037109375, -68.368408203125, -66.6064453125, -64.844482421875, -63.08251953125, -61.320556640625, -59.55859375, -57.796630859375, -56.03466796875, -54.272705078125, -52.5107421875, -50.748779296875, -48.98681640625, -47.224853515625, -45.462890625, -43.700927734375, -41.93896484375, -40.177001953125, -38.4150390625, -36.653076171875, -34.89111328125, -33.129150390625, -31.3671875, -29.605224609375, -27.84326171875, -26.081298828125, -24.3193359375, -22.557373046875, -20.79541015625, -19.033447265625, -17.271484375, -15.509521484375, -13.74755859375, -11.985595703125, -10.2236328125, -8.461669921875, -6.69970703125, -4.937744140625, -3.17578125, -1.413818359375, 0.34814453125, 2.110107421875, 3.8720703125, 5.634033203125, 7.39599609375, 9.157958984375, 10.919921875, 12.681884765625, 14.44384765625, 16.205810546875, 17.9677734375, 19.729736328125, 21.49169921875, 23.253662109375, 25.015625]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 6.0, 10.0, 13.0, 9.0, 15.0, 21.0, 16.0, 21.0, 30.0, 29.0, 28.0, 43.0, 55.0, 78.0, 167.0, 1195.0, 962511.0, 83323.0, 481.0, 128.0, 66.0, 60.0, 41.0, 23.0, 38.0, 24.0, 22.0, 20.0, 11.0, 8.0, 14.0, 9.0, 8.0, 10.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-127.9375, -124.3681640625, -120.798828125, -117.2294921875, -113.66015625, -110.0908203125, -106.521484375, -102.9521484375, -99.3828125, -95.8134765625, -92.244140625, -88.6748046875, -85.10546875, -81.5361328125, -77.966796875, -74.3974609375, -70.828125, -67.2587890625, -63.689453125, -60.1201171875, -56.55078125, -52.9814453125, -49.412109375, -45.8427734375, -42.2734375, -38.7041015625, -35.134765625, -31.5654296875, -27.99609375, -24.4267578125, -20.857421875, -17.2880859375, -13.71875, -10.1494140625, -6.580078125, -3.0107421875, 0.55859375, 4.1279296875, 7.697265625, 11.2666015625, 14.8359375, 18.4052734375, 21.974609375, 25.5439453125, 29.11328125, 32.6826171875, 36.251953125, 39.8212890625, 43.390625, 46.9599609375, 50.529296875, 54.0986328125, 57.66796875, 61.2373046875, 64.806640625, 68.3759765625, 71.9453125, 75.5146484375, 79.083984375, 82.6533203125, 86.22265625, 89.7919921875, 93.361328125, 96.9306640625, 100.5]}, "gradients/decoder.model.decoder.layers.9.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 7.0, 6.0, 10.0, 15.0, 16.0, 18.0, 8.0, 24.0, 27.0, 34.0, 33.0, 41.0, 48.0, 48.0, 60.0, 71.0, 49.0, 59.0, 55.0, 55.0, 51.0, 41.0, 36.0, 29.0, 41.0, 22.0, 24.0, 13.0, 13.0, 15.0, 11.0, 10.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.890625, -28.848876953125, -27.80712890625, -26.765380859375, -25.7236328125, -24.681884765625, -23.64013671875, -22.598388671875, -21.556640625, -20.514892578125, -19.47314453125, -18.431396484375, -17.3896484375, -16.347900390625, -15.30615234375, -14.264404296875, -13.22265625, -12.180908203125, -11.13916015625, -10.097412109375, -9.0556640625, -8.013916015625, -6.97216796875, -5.930419921875, -4.888671875, -3.846923828125, -2.80517578125, -1.763427734375, -0.7216796875, 0.320068359375, 1.36181640625, 2.403564453125, 3.4453125, 4.487060546875, 5.52880859375, 6.570556640625, 7.6123046875, 8.654052734375, 9.69580078125, 10.737548828125, 11.779296875, 12.821044921875, 13.86279296875, 14.904541015625, 15.9462890625, 16.988037109375, 18.02978515625, 19.071533203125, 20.11328125, 21.155029296875, 22.19677734375, 23.238525390625, 24.2802734375, 25.322021484375, 26.36376953125, 27.405517578125, 28.447265625, 29.489013671875, 30.53076171875, 31.572509765625, 32.6142578125, 33.656005859375, 34.69775390625, 35.739501953125, 36.78125]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 5.0, 7.0, 11.0, 8.0, 14.0, 19.0, 29.0, 53.0, 79.0, 203.0, 648.0, 3125.0, 49597.0, 965327.0, 26152.0, 2385.0, 521.0, 173.0, 63.0, 31.0, 22.0, 22.0, 10.0, 11.0, 11.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.609375, -17.08251953125, -16.5556640625, -16.02880859375, -15.501953125, -14.97509765625, -14.4482421875, -13.92138671875, -13.39453125, -12.86767578125, -12.3408203125, -11.81396484375, -11.287109375, -10.76025390625, -10.2333984375, -9.70654296875, -9.1796875, -8.65283203125, -8.1259765625, -7.59912109375, -7.072265625, -6.54541015625, -6.0185546875, -5.49169921875, -4.96484375, -4.43798828125, -3.9111328125, -3.38427734375, -2.857421875, -2.33056640625, -1.8037109375, -1.27685546875, -0.75, -0.22314453125, 0.3037109375, 0.83056640625, 1.357421875, 1.88427734375, 2.4111328125, 2.93798828125, 3.46484375, 3.99169921875, 4.5185546875, 5.04541015625, 5.572265625, 6.09912109375, 6.6259765625, 7.15283203125, 7.6796875, 8.20654296875, 8.7333984375, 9.26025390625, 9.787109375, 10.31396484375, 10.8408203125, 11.36767578125, 11.89453125, 12.42138671875, 12.9482421875, 13.47509765625, 14.001953125, 14.52880859375, 15.0556640625, 15.58251953125, 16.109375]}, "gradients/decoder.model.decoder.layers.9.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 1.0, 5.0, 6.0, 12.0, 13.0, 19.0, 35.0, 31.0, 51.0, 56.0, 69.0, 80.0, 109.0, 116.0, 69.0, 78.0, 58.0, 40.0, 31.0, 28.0, 27.0, 15.0, 12.0, 9.0, 7.0, 6.0, 4.0, 3.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0008234977722167969, -0.0007978752255439758, -0.0007722526788711548, -0.0007466301321983337, -0.0007210075855255127, -0.0006953850388526917, -0.0006697624921798706, -0.0006441399455070496, -0.0006185173988342285, -0.0005928948521614075, -0.0005672723054885864, -0.0005416497588157654, -0.0005160272121429443, -0.0004904046654701233, -0.00046478211879730225, -0.0004391595721244812, -0.00041353702545166016, -0.0003879144787788391, -0.00036229193210601807, -0.000336669385433197, -0.000311046838760376, -0.00028542429208755493, -0.0002598017454147339, -0.00023417919874191284, -0.0002085566520690918, -0.00018293410539627075, -0.0001573115587234497, -0.00013168901205062866, -0.00010606646537780762, -8.044391870498657e-05, -5.482137203216553e-05, -2.9198825359344482e-05, -3.5762786865234375e-06, 2.2046267986297607e-05, 4.766881465911865e-05, 7.32913613319397e-05, 9.891390800476074e-05, 0.0001245364546775818, 0.00015015900135040283, 0.00017578154802322388, 0.00020140409469604492, 0.00022702664136886597, 0.000252649188041687, 0.00027827173471450806, 0.0003038942813873291, 0.00032951682806015015, 0.0003551393747329712, 0.00038076192140579224, 0.0004063844680786133, 0.0004320070147514343, 0.00045762956142425537, 0.0004832521080970764, 0.0005088746547698975, 0.0005344972014427185, 0.0005601197481155396, 0.0005857422947883606, 0.0006113648414611816, 0.0006369873881340027, 0.0006626099348068237, 0.0006882324814796448, 0.0007138550281524658, 0.0007394775748252869, 0.0007651001214981079, 0.000790722668170929, 0.00081634521484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 3.0, 3.0, 7.0, 11.0, 14.0, 18.0, 18.0, 21.0, 29.0, 48.0, 87.0, 127.0, 222.0, 488.0, 1092.0, 3054.0, 10648.0, 58427.0, 433903.0, 460394.0, 62960.0, 11294.0, 3266.0, 1233.0, 518.0, 276.0, 138.0, 66.0, 55.0, 33.0, 26.0, 13.0, 14.0, 9.0, 9.0, 3.0, 10.0, 5.0, 5.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.515625, -5.3255615234375, -5.135498046875, -4.9454345703125, -4.75537109375, -4.5653076171875, -4.375244140625, -4.1851806640625, -3.9951171875, -3.8050537109375, -3.614990234375, -3.4249267578125, -3.23486328125, -3.0447998046875, -2.854736328125, -2.6646728515625, -2.474609375, -2.2845458984375, -2.094482421875, -1.9044189453125, -1.71435546875, -1.5242919921875, -1.334228515625, -1.1441650390625, -0.9541015625, -0.7640380859375, -0.573974609375, -0.3839111328125, -0.19384765625, -0.0037841796875, 0.186279296875, 0.3763427734375, 0.56640625, 0.7564697265625, 0.946533203125, 1.1365966796875, 1.32666015625, 1.5167236328125, 1.706787109375, 1.8968505859375, 2.0869140625, 2.2769775390625, 2.467041015625, 2.6571044921875, 2.84716796875, 3.0372314453125, 3.227294921875, 3.4173583984375, 3.607421875, 3.7974853515625, 3.987548828125, 4.1776123046875, 4.36767578125, 4.5577392578125, 4.747802734375, 4.9378662109375, 5.1279296875, 5.3179931640625, 5.508056640625, 5.6981201171875, 5.88818359375, 6.0782470703125, 6.268310546875, 6.4583740234375, 6.6484375]}, "gradients/decoder.model.decoder.layers.9.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 3.0, 8.0, 8.0, 8.0, 6.0, 11.0, 18.0, 21.0, 21.0, 31.0, 48.0, 64.0, 83.0, 85.0, 93.0, 104.0, 82.0, 62.0, 56.0, 43.0, 27.0, 23.0, 14.0, 9.0, 15.0, 12.0, 5.0, 8.0, 9.0, 7.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.525390625, -2.44818115234375, -2.3709716796875, -2.29376220703125, -2.216552734375, -2.13934326171875, -2.0621337890625, -1.98492431640625, -1.90771484375, -1.83050537109375, -1.7532958984375, -1.67608642578125, -1.598876953125, -1.52166748046875, -1.4444580078125, -1.36724853515625, -1.2900390625, -1.21282958984375, -1.1356201171875, -1.05841064453125, -0.981201171875, -0.90399169921875, -0.8267822265625, -0.74957275390625, -0.67236328125, -0.59515380859375, -0.5179443359375, -0.44073486328125, -0.363525390625, -0.28631591796875, -0.2091064453125, -0.13189697265625, -0.0546875, 0.02252197265625, 0.0997314453125, 0.17694091796875, 0.254150390625, 0.33135986328125, 0.4085693359375, 0.48577880859375, 0.56298828125, 0.64019775390625, 0.7174072265625, 0.79461669921875, 0.871826171875, 0.94903564453125, 1.0262451171875, 1.10345458984375, 1.1806640625, 1.25787353515625, 1.3350830078125, 1.41229248046875, 1.489501953125, 1.56671142578125, 1.6439208984375, 1.72113037109375, 1.79833984375, 1.87554931640625, 1.9527587890625, 2.02996826171875, 2.107177734375, 2.18438720703125, 2.2615966796875, 2.33880615234375, 2.416015625]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 9.0, 29.0, 45.0, 97.0, 150.0, 175.0, 195.0, 139.0, 89.0, 39.0, 13.0, 7.0, 7.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-99.71598815917969, -97.583251953125, -95.45051574707031, -93.31777954101562, -91.18504333496094, -89.05230712890625, -86.91957092285156, -84.78682708740234, -82.65409088134766, -80.52135467529297, -78.38861846923828, -76.2558822631836, -74.1231460571289, -71.99040222167969, -69.857666015625, -67.72492980957031, -65.59219360351562, -63.45945739746094, -61.32672119140625, -59.19398498535156, -57.06124496459961, -54.92850875854492, -52.795772552490234, -50.66303634643555, -48.530303955078125, -46.39756774902344, -44.26483154296875, -42.13209533691406, -39.99935531616211, -37.86661911010742, -35.733882904052734, -33.60114669799805, -31.468406677246094, -29.335670471191406, -27.202932357788086, -25.0701961517334, -22.937458038330078, -20.80472183227539, -18.671985626220703, -16.539249420166016, -14.406511306762695, -12.273774147033691, -10.141036987304688, -8.00830078125, -5.875563621520996, -3.742826461791992, -1.6100902557373047, 0.5226469039916992, 2.655384063720703, 4.788121223449707, 6.920857906341553, 9.053594589233398, 11.186331748962402, 13.319068908691406, 15.451805114746094, 17.58454132080078, 19.7172794342041, 21.85001564025879, 23.98275375366211, 26.115489959716797, 28.248226165771484, 30.380964279174805, 32.513702392578125, 34.64643859863281, 36.7791748046875]}, "gradients/decoder.model.decoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 6.0, 7.0, 11.0, 26.0, 36.0, 30.0, 46.0, 48.0, 64.0, 69.0, 80.0, 92.0, 63.0, 83.0, 64.0, 66.0, 51.0, 42.0, 36.0, 26.0, 22.0, 7.0, 11.0, 7.0, 8.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-93.14926147460938, -90.99736785888672, -88.84547424316406, -86.6935806274414, -84.54168701171875, -82.38980102539062, -80.23789978027344, -78.08601379394531, -75.93412017822266, -73.7822265625, -71.63033294677734, -69.47843933105469, -67.32654571533203, -65.17465209960938, -63.022762298583984, -60.87086868286133, -58.71897506713867, -56.567081451416016, -54.41518783569336, -52.26329803466797, -50.11140441894531, -47.959510803222656, -45.8076171875, -43.655723571777344, -41.50382995605469, -39.35193634033203, -37.200042724609375, -35.04814910888672, -32.89625930786133, -30.744365692138672, -28.592472076416016, -26.44057846069336, -24.288684844970703, -22.136791229248047, -19.984899520874023, -17.833005905151367, -15.681113243103027, -13.529220581054688, -11.377326965332031, -9.225434303283691, -7.073541641235352, -4.921648979187012, -2.7697558403015137, -0.6178627014160156, 1.5340299606323242, 3.685922622680664, 5.83781623840332, 7.98970890045166, 10.1416015625, 12.29349422454834, 14.44538688659668, 16.597280502319336, 18.74917221069336, 20.901065826416016, 23.052959442138672, 25.204853057861328, 27.35674476623535, 29.508638381958008, 31.66053009033203, 33.81242370605469, 35.964317321777344, 38.1162109375, 40.268104553222656, 42.41999435424805, 44.5718879699707]}, "gradients/decoder.model.decoder.layers.8.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 4.0, 4.0, 8.0, 9.0, 12.0, 26.0, 32.0, 53.0, 106.0, 172.0, 326.0, 655.0, 1833.0, 8424.0, 86049.0, 1201589.0, 2523957.0, 336892.0, 25244.0, 4568.0, 1614.0, 1113.0, 832.0, 485.0, 175.0, 65.0, 19.0, 10.0, 7.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.375, -27.37060546875, -26.3662109375, -25.36181640625, -24.357421875, -23.35302734375, -22.3486328125, -21.34423828125, -20.33984375, -19.33544921875, -18.3310546875, -17.32666015625, -16.322265625, -15.31787109375, -14.3134765625, -13.30908203125, -12.3046875, -11.30029296875, -10.2958984375, -9.29150390625, -8.287109375, -7.28271484375, -6.2783203125, -5.27392578125, -4.26953125, -3.26513671875, -2.2607421875, -1.25634765625, -0.251953125, 0.75244140625, 1.7568359375, 2.76123046875, 3.765625, 4.77001953125, 5.7744140625, 6.77880859375, 7.783203125, 8.78759765625, 9.7919921875, 10.79638671875, 11.80078125, 12.80517578125, 13.8095703125, 14.81396484375, 15.818359375, 16.82275390625, 17.8271484375, 18.83154296875, 19.8359375, 20.84033203125, 21.8447265625, 22.84912109375, 23.853515625, 24.85791015625, 25.8623046875, 26.86669921875, 27.87109375, 28.87548828125, 29.8798828125, 30.88427734375, 31.888671875, 32.89306640625, 33.8974609375, 34.90185546875, 35.90625]}, "gradients/decoder.model.decoder.layers.8.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 15.0, 20.0, 32.0, 52.0, 83.0, 101.0, 109.0, 126.0, 141.0, 115.0, 76.0, 55.0, 33.0, 24.0, 10.0, 12.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-67.8125, -66.385498046875, -64.95849609375, -63.531494140625, -62.1044921875, -60.677490234375, -59.25048828125, -57.823486328125, -56.396484375, -54.969482421875, -53.54248046875, -52.115478515625, -50.6884765625, -49.261474609375, -47.83447265625, -46.407470703125, -44.98046875, -43.553466796875, -42.12646484375, -40.699462890625, -39.2724609375, -37.845458984375, -36.41845703125, -34.991455078125, -33.564453125, -32.137451171875, -30.71044921875, -29.283447265625, -27.8564453125, -26.429443359375, -25.00244140625, -23.575439453125, -22.1484375, -20.721435546875, -19.29443359375, -17.867431640625, -16.4404296875, -15.013427734375, -13.58642578125, -12.159423828125, -10.732421875, -9.305419921875, -7.87841796875, -6.451416015625, -5.0244140625, -3.597412109375, -2.17041015625, -0.743408203125, 0.68359375, 2.110595703125, 3.53759765625, 4.964599609375, 6.3916015625, 7.818603515625, 9.24560546875, 10.672607421875, 12.099609375, 13.526611328125, 14.95361328125, 16.380615234375, 17.8076171875, 19.234619140625, 20.66162109375, 22.088623046875, 23.515625]}, "gradients/decoder.model.decoder.layers.8.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 3.0, 6.0, 8.0, 5.0, 9.0, 27.0, 43.0, 53.0, 98.0, 207.0, 501.0, 1856.0, 15246.0, 739702.0, 3375750.0, 55328.0, 3983.0, 789.0, 294.0, 145.0, 74.0, 52.0, 24.0, 25.0, 16.0, 7.0, 7.0, 10.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-41.09375, -39.6865234375, -38.279296875, -36.8720703125, -35.46484375, -34.0576171875, -32.650390625, -31.2431640625, -29.8359375, -28.4287109375, -27.021484375, -25.6142578125, -24.20703125, -22.7998046875, -21.392578125, -19.9853515625, -18.578125, -17.1708984375, -15.763671875, -14.3564453125, -12.94921875, -11.5419921875, -10.134765625, -8.7275390625, -7.3203125, -5.9130859375, -4.505859375, -3.0986328125, -1.69140625, -0.2841796875, 1.123046875, 2.5302734375, 3.9375, 5.3447265625, 6.751953125, 8.1591796875, 9.56640625, 10.9736328125, 12.380859375, 13.7880859375, 15.1953125, 16.6025390625, 18.009765625, 19.4169921875, 20.82421875, 22.2314453125, 23.638671875, 25.0458984375, 26.453125, 27.8603515625, 29.267578125, 30.6748046875, 32.08203125, 33.4892578125, 34.896484375, 36.3037109375, 37.7109375, 39.1181640625, 40.525390625, 41.9326171875, 43.33984375, 44.7470703125, 46.154296875, 47.5615234375, 48.96875]}, "gradients/decoder.model.decoder.layers.8.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 3.0, 5.0, 13.0, 13.0, 27.0, 50.0, 68.0, 96.0, 182.0, 280.0, 447.0, 637.0, 693.0, 596.0, 387.0, 227.0, 126.0, 66.0, 50.0, 36.0, 19.0, 13.0, 6.0, 3.0, 9.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.8984375, -9.582275390625, -9.26611328125, -8.949951171875, -8.6337890625, -8.317626953125, -8.00146484375, -7.685302734375, -7.369140625, -7.052978515625, -6.73681640625, -6.420654296875, -6.1044921875, -5.788330078125, -5.47216796875, -5.156005859375, -4.83984375, -4.523681640625, -4.20751953125, -3.891357421875, -3.5751953125, -3.259033203125, -2.94287109375, -2.626708984375, -2.310546875, -1.994384765625, -1.67822265625, -1.362060546875, -1.0458984375, -0.729736328125, -0.41357421875, -0.097412109375, 0.21875, 0.534912109375, 0.85107421875, 1.167236328125, 1.4833984375, 1.799560546875, 2.11572265625, 2.431884765625, 2.748046875, 3.064208984375, 3.38037109375, 3.696533203125, 4.0126953125, 4.328857421875, 4.64501953125, 4.961181640625, 5.27734375, 5.593505859375, 5.90966796875, 6.225830078125, 6.5419921875, 6.858154296875, 7.17431640625, 7.490478515625, 7.806640625, 8.122802734375, 8.43896484375, 8.755126953125, 9.0712890625, 9.387451171875, 9.70361328125, 10.019775390625, 10.3359375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 7.0, 23.0, 16.0, 40.0, 65.0, 80.0, 107.0, 104.0, 109.0, 121.0, 87.0, 80.0, 57.0, 31.0, 28.0, 12.0, 10.0, 8.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-50.15424346923828, -49.102474212646484, -48.05070114135742, -46.998931884765625, -45.94715881347656, -44.895389556884766, -43.8436164855957, -42.791847229003906, -41.740074157714844, -40.68830490112305, -39.636531829833984, -38.58476257324219, -37.532989501953125, -36.48122024536133, -35.429447174072266, -34.37767791748047, -33.325904846191406, -32.27413558959961, -31.222362518310547, -30.170591354370117, -29.118820190429688, -28.067049026489258, -27.015277862548828, -25.96350860595703, -24.911739349365234, -23.859968185424805, -22.808197021484375, -21.756425857543945, -20.704654693603516, -19.652883529663086, -18.601112365722656, -17.54934310913086, -16.497570037841797, -15.445798873901367, -14.394027709960938, -13.342256546020508, -12.290485382080078, -11.238714218139648, -10.186944007873535, -9.135172843933105, -8.083401679992676, -7.031630516052246, -5.979859352111816, -4.928088665008545, -3.8763175010681152, -2.8245463371276855, -1.772775650024414, -0.7210044860839844, 0.3307666778564453, 1.3825377225875854, 2.4343087673187256, 3.486079692840576, 4.537850856781006, 5.5896220207214355, 6.641392707824707, 7.693163871765137, 8.744935035705566, 9.796706199645996, 10.848477363586426, 11.900247573852539, 12.952018737792969, 14.003789901733398, 15.055561065673828, 16.107332229614258, 17.159103393554688]}, "gradients/decoder.model.decoder.layers.8.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 11.0, 11.0, 18.0, 19.0, 34.0, 37.0, 51.0, 53.0, 72.0, 88.0, 97.0, 97.0, 79.0, 86.0, 80.0, 62.0, 39.0, 20.0, 22.0, 15.0, 8.0, 3.0, 5.0, 4.0, 2.0, 2.0], "bins": [-58.893341064453125, -57.70150375366211, -56.509666442871094, -55.317832946777344, -54.12599563598633, -52.93415832519531, -51.74232482910156, -50.55048751831055, -49.35865020751953, -48.166812896728516, -46.9749755859375, -45.78314208984375, -44.591304779052734, -43.39946746826172, -42.20763397216797, -41.01579666137695, -39.82395935058594, -38.63212203979492, -37.440284729003906, -36.248451232910156, -35.05661392211914, -33.864776611328125, -32.672943115234375, -31.48110580444336, -30.289268493652344, -29.097431182861328, -27.905595779418945, -26.713760375976562, -25.521923065185547, -24.33008575439453, -23.13825035095215, -21.946414947509766, -20.754579544067383, -19.562744140625, -18.370906829833984, -17.17906951904297, -15.987234115600586, -14.795397758483887, -13.603561401367188, -12.411725044250488, -11.219888687133789, -10.02805233001709, -8.83621597290039, -7.644379615783691, -6.452543258666992, -5.260706901550293, -4.068870544433594, -2.8770341873168945, -1.6851978302001953, -0.4933614730834961, 0.6984748840332031, 1.8903112411499023, 3.0821475982666016, 4.273983955383301, 5.4658203125, 6.657656669616699, 7.849493026733398, 9.041329383850098, 10.233165740966797, 11.425002098083496, 12.616838455200195, 13.808674812316895, 15.000511169433594, 16.19234848022461, 17.384183883666992]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 12.0, 14.0, 35.0, 52.0, 101.0, 299.0, 871.0, 4315.0, 96277.0, 907187.0, 35677.0, 2648.0, 657.0, 214.0, 95.0, 35.0, 26.0, 16.0, 8.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -17.041259765625, -16.62939453125, -16.217529296875, -15.8056640625, -15.393798828125, -14.98193359375, -14.570068359375, -14.158203125, -13.746337890625, -13.33447265625, -12.922607421875, -12.5107421875, -12.098876953125, -11.68701171875, -11.275146484375, -10.86328125, -10.451416015625, -10.03955078125, -9.627685546875, -9.2158203125, -8.803955078125, -8.39208984375, -7.980224609375, -7.568359375, -7.156494140625, -6.74462890625, -6.332763671875, -5.9208984375, -5.509033203125, -5.09716796875, -4.685302734375, -4.2734375, -3.861572265625, -3.44970703125, -3.037841796875, -2.6259765625, -2.214111328125, -1.80224609375, -1.390380859375, -0.978515625, -0.566650390625, -0.15478515625, 0.257080078125, 0.6689453125, 1.080810546875, 1.49267578125, 1.904541015625, 2.31640625, 2.728271484375, 3.14013671875, 3.552001953125, 3.9638671875, 4.375732421875, 4.78759765625, 5.199462890625, 5.611328125, 6.023193359375, 6.43505859375, 6.846923828125, 7.2587890625, 7.670654296875, 8.08251953125, 8.494384765625, 8.90625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 11.0, 18.0, 19.0, 30.0, 47.0, 66.0, 81.0, 102.0, 129.0, 111.0, 102.0, 88.0, 87.0, 42.0, 29.0, 13.0, 17.0, 10.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.71875, -42.8067626953125, -41.894775390625, -40.9827880859375, -40.07080078125, -39.1588134765625, -38.246826171875, -37.3348388671875, -36.4228515625, -35.5108642578125, -34.598876953125, -33.6868896484375, -32.77490234375, -31.8629150390625, -30.950927734375, -30.0389404296875, -29.126953125, -28.2149658203125, -27.302978515625, -26.3909912109375, -25.47900390625, -24.5670166015625, -23.655029296875, -22.7430419921875, -21.8310546875, -20.9190673828125, -20.007080078125, -19.0950927734375, -18.18310546875, -17.2711181640625, -16.359130859375, -15.4471435546875, -14.53515625, -13.6231689453125, -12.711181640625, -11.7991943359375, -10.88720703125, -9.9752197265625, -9.063232421875, -8.1512451171875, -7.2392578125, -6.3272705078125, -5.415283203125, -4.5032958984375, -3.59130859375, -2.6793212890625, -1.767333984375, -0.8553466796875, 0.056640625, 0.9686279296875, 1.880615234375, 2.7926025390625, 3.70458984375, 4.6165771484375, 5.528564453125, 6.4405517578125, 7.3525390625, 8.2645263671875, 9.176513671875, 10.0885009765625, 11.00048828125, 11.9124755859375, 12.824462890625, 13.7364501953125, 14.6484375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 6.0, 6.0, 6.0, 11.0, 14.0, 39.0, 41.0, 66.0, 104.0, 166.0, 256.0, 471.0, 752.0, 1307.0, 2379.0, 4513.0, 8592.0, 17211.0, 35611.0, 76324.0, 158101.0, 263178.0, 235615.0, 126663.0, 59679.0, 28267.0, 13867.0, 6902.0, 3629.0, 1966.0, 1140.0, 617.0, 411.0, 245.0, 139.0, 101.0, 64.0, 35.0, 25.0, 11.0, 9.0, 10.0, 7.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7705078125, -1.7165985107421875, -1.662689208984375, -1.6087799072265625, -1.55487060546875, -1.5009613037109375, -1.447052001953125, -1.3931427001953125, -1.3392333984375, -1.2853240966796875, -1.231414794921875, -1.1775054931640625, -1.12359619140625, -1.0696868896484375, -1.015777587890625, -0.9618682861328125, -0.907958984375, -0.8540496826171875, -0.800140380859375, -0.7462310791015625, -0.69232177734375, -0.6384124755859375, -0.584503173828125, -0.5305938720703125, -0.4766845703125, -0.4227752685546875, -0.368865966796875, -0.3149566650390625, -0.26104736328125, -0.2071380615234375, -0.153228759765625, -0.0993194580078125, -0.04541015625, 0.0084991455078125, 0.062408447265625, 0.1163177490234375, 0.17022705078125, 0.2241363525390625, 0.278045654296875, 0.3319549560546875, 0.3858642578125, 0.4397735595703125, 0.493682861328125, 0.5475921630859375, 0.60150146484375, 0.6554107666015625, 0.709320068359375, 0.7632293701171875, 0.817138671875, 0.8710479736328125, 0.924957275390625, 0.9788665771484375, 1.03277587890625, 1.0866851806640625, 1.140594482421875, 1.1945037841796875, 1.2484130859375, 1.3023223876953125, 1.356231689453125, 1.4101409912109375, 1.46405029296875, 1.5179595947265625, 1.571868896484375, 1.6257781982421875, 1.6796875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 4.0, 9.0, 9.0, 11.0, 11.0, 19.0, 17.0, 26.0, 23.0, 30.0, 26.0, 39.0, 35.0, 33.0, 32.0, 60.0, 59.0, 46.0, 56.0, 44.0, 58.0, 36.0, 41.0, 38.0, 42.0, 30.0, 22.0, 24.0, 24.0, 17.0, 22.0, 11.0, 13.0, 14.0, 5.0, 3.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.40625, -24.58740234375, -23.7685546875, -22.94970703125, -22.130859375, -21.31201171875, -20.4931640625, -19.67431640625, -18.85546875, -18.03662109375, -17.2177734375, -16.39892578125, -15.580078125, -14.76123046875, -13.9423828125, -13.12353515625, -12.3046875, -11.48583984375, -10.6669921875, -9.84814453125, -9.029296875, -8.21044921875, -7.3916015625, -6.57275390625, -5.75390625, -4.93505859375, -4.1162109375, -3.29736328125, -2.478515625, -1.65966796875, -0.8408203125, -0.02197265625, 0.796875, 1.61572265625, 2.4345703125, 3.25341796875, 4.072265625, 4.89111328125, 5.7099609375, 6.52880859375, 7.34765625, 8.16650390625, 8.9853515625, 9.80419921875, 10.623046875, 11.44189453125, 12.2607421875, 13.07958984375, 13.8984375, 14.71728515625, 15.5361328125, 16.35498046875, 17.173828125, 17.99267578125, 18.8115234375, 19.63037109375, 20.44921875, 21.26806640625, 22.0869140625, 22.90576171875, 23.724609375, 24.54345703125, 25.3623046875, 26.18115234375, 27.0]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 3.0, 6.0, 7.0, 14.0, 19.0, 21.0, 19.0, 36.0, 36.0, 72.0, 113.0, 111.0, 225.0, 318.0, 494.0, 920.0, 1849.0, 4144.0, 11769.0, 43054.0, 171328.0, 439026.0, 272186.0, 72392.0, 19082.0, 6018.0, 2350.0, 1155.0, 651.0, 376.0, 236.0, 163.0, 106.0, 78.0, 51.0, 46.0, 22.0, 18.0, 12.0, 10.0, 6.0, 5.0, 11.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.333984375, -0.3240699768066406, -0.31415557861328125, -0.3042411804199219, -0.2943267822265625, -0.2844123840332031, -0.27449798583984375, -0.2645835876464844, -0.254669189453125, -0.24475479125976562, -0.23484039306640625, -0.22492599487304688, -0.2150115966796875, -0.20509719848632812, -0.19518280029296875, -0.18526840209960938, -0.17535400390625, -0.16543960571289062, -0.15552520751953125, -0.14561080932617188, -0.1356964111328125, -0.12578201293945312, -0.11586761474609375, -0.10595321655273438, -0.096038818359375, -0.08612442016601562, -0.07621002197265625, -0.06629562377929688, -0.0563812255859375, -0.046466827392578125, -0.03655242919921875, -0.026638031005859375, -0.0167236328125, -0.006809234619140625, 0.00310516357421875, 0.013019561767578125, 0.0229339599609375, 0.032848358154296875, 0.04276275634765625, 0.052677154541015625, 0.062591552734375, 0.07250595092773438, 0.08242034912109375, 0.09233474731445312, 0.1022491455078125, 0.11216354370117188, 0.12207794189453125, 0.13199234008789062, 0.14190673828125, 0.15182113647460938, 0.16173553466796875, 0.17164993286132812, 0.1815643310546875, 0.19147872924804688, 0.20139312744140625, 0.21130752563476562, 0.221221923828125, 0.23113632202148438, 0.24105072021484375, 0.2509651184082031, 0.2608795166015625, 0.2707939147949219, 0.28070831298828125, 0.2906227111816406, 0.300537109375]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 3.0, 1.0, 4.0, 11.0, 13.0, 14.0, 20.0, 25.0, 27.0, 41.0, 50.0, 54.0, 72.0, 87.0, 97.0, 92.0, 73.0, 71.0, 57.0, 40.0, 40.0, 36.0, 24.0, 14.0, 10.0, 10.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00024890899658203125, -0.00024296343326568604, -0.00023701786994934082, -0.0002310723066329956, -0.0002251267433166504, -0.00021918118000030518, -0.00021323561668395996, -0.00020729005336761475, -0.00020134449005126953, -0.00019539892673492432, -0.0001894533634185791, -0.0001835078001022339, -0.00017756223678588867, -0.00017161667346954346, -0.00016567111015319824, -0.00015972554683685303, -0.0001537799835205078, -0.0001478344202041626, -0.00014188885688781738, -0.00013594329357147217, -0.00012999773025512695, -0.00012405216693878174, -0.00011810660362243652, -0.00011216104030609131, -0.0001062154769897461, -0.00010026991367340088, -9.432435035705566e-05, -8.837878704071045e-05, -8.243322372436523e-05, -7.648766040802002e-05, -7.05420970916748e-05, -6.459653377532959e-05, -5.8650970458984375e-05, -5.270540714263916e-05, -4.6759843826293945e-05, -4.081428050994873e-05, -3.4868717193603516e-05, -2.89231538772583e-05, -2.2977590560913086e-05, -1.703202724456787e-05, -1.1086463928222656e-05, -5.140900611877441e-06, 8.046627044677734e-07, 6.750226020812988e-06, 1.2695789337158203e-05, 1.8641352653503418e-05, 2.4586915969848633e-05, 3.053247928619385e-05, 3.647804260253906e-05, 4.242360591888428e-05, 4.836916923522949e-05, 5.431473255157471e-05, 6.026029586791992e-05, 6.620585918426514e-05, 7.215142250061035e-05, 7.809698581695557e-05, 8.404254913330078e-05, 8.9988112449646e-05, 9.593367576599121e-05, 0.00010187923908233643, 0.00010782480239868164, 0.00011377036571502686, 0.00011971592903137207, 0.00012566149234771729, 0.0001316070556640625]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 4.0, 3.0, 9.0, 17.0, 14.0, 25.0, 33.0, 46.0, 82.0, 128.0, 219.0, 408.0, 757.0, 1982.0, 6066.0, 22300.0, 99270.0, 386126.0, 394902.0, 102884.0, 23337.0, 6148.0, 2048.0, 807.0, 387.0, 196.0, 109.0, 82.0, 64.0, 22.0, 23.0, 21.0, 7.0, 6.0, 5.0, 7.0, 4.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.331298828125, -0.3209495544433594, -0.31060028076171875, -0.3002510070800781, -0.2899017333984375, -0.2795524597167969, -0.26920318603515625, -0.2588539123535156, -0.248504638671875, -0.23815536499023438, -0.22780609130859375, -0.21745681762695312, -0.2071075439453125, -0.19675827026367188, -0.18640899658203125, -0.17605972290039062, -0.16571044921875, -0.15536117553710938, -0.14501190185546875, -0.13466262817382812, -0.1243133544921875, -0.11396408081054688, -0.10361480712890625, -0.09326553344726562, -0.082916259765625, -0.07256698608398438, -0.06221771240234375, -0.051868438720703125, -0.0415191650390625, -0.031169891357421875, -0.02082061767578125, -0.010471343994140625, -0.0001220703125, 0.010227203369140625, 0.02057647705078125, 0.030925750732421875, 0.0412750244140625, 0.051624298095703125, 0.06197357177734375, 0.07232284545898438, 0.082672119140625, 0.09302139282226562, 0.10337066650390625, 0.11371994018554688, 0.1240692138671875, 0.13441848754882812, 0.14476776123046875, 0.15511703491210938, 0.16546630859375, 0.17581558227539062, 0.18616485595703125, 0.19651412963867188, 0.2068634033203125, 0.21721267700195312, 0.22756195068359375, 0.23791122436523438, 0.248260498046875, 0.2586097717285156, 0.26895904541015625, 0.2793083190917969, 0.2896575927734375, 0.3000068664550781, 0.31035614013671875, 0.3207054138183594, 0.3310546875]}, "gradients/decoder.model.decoder.layers.8.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 1.0, 5.0, 4.0, 7.0, 9.0, 19.0, 21.0, 28.0, 35.0, 32.0, 58.0, 53.0, 67.0, 68.0, 79.0, 63.0, 68.0, 49.0, 72.0, 67.0, 46.0, 42.0, 21.0, 21.0, 13.0, 9.0, 11.0, 6.0, 6.0, 10.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.10430908203125, -0.1014871597290039, -0.09866523742675781, -0.09584331512451172, -0.09302139282226562, -0.09019947052001953, -0.08737754821777344, -0.08455562591552734, -0.08173370361328125, -0.07891178131103516, -0.07608985900878906, -0.07326793670654297, -0.07044601440429688, -0.06762409210205078, -0.06480216979980469, -0.061980247497558594, -0.0591583251953125, -0.056336402893066406, -0.05351448059082031, -0.05069255828857422, -0.047870635986328125, -0.04504871368408203, -0.04222679138183594, -0.039404869079589844, -0.03658294677734375, -0.033761024475097656, -0.030939102172851562, -0.02811717987060547, -0.025295257568359375, -0.02247333526611328, -0.019651412963867188, -0.016829490661621094, -0.014007568359375, -0.011185646057128906, -0.008363723754882812, -0.005541801452636719, -0.002719879150390625, 0.00010204315185546875, 0.0029239654541015625, 0.005745887756347656, 0.00856781005859375, 0.011389732360839844, 0.014211654663085938, 0.01703357696533203, 0.019855499267578125, 0.02267742156982422, 0.025499343872070312, 0.028321266174316406, 0.0311431884765625, 0.033965110778808594, 0.03678703308105469, 0.03960895538330078, 0.042430877685546875, 0.04525279998779297, 0.04807472229003906, 0.050896644592285156, 0.05371856689453125, 0.056540489196777344, 0.05936241149902344, 0.06218433380126953, 0.06500625610351562, 0.06782817840576172, 0.07065010070800781, 0.0734720230102539, 0.0762939453125]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 1.0, 6.0, 8.0, 15.0, 27.0, 27.0, 60.0, 78.0, 85.0, 120.0, 121.0, 117.0, 99.0, 69.0, 58.0, 41.0, 29.0, 9.0, 13.0, 8.0, 3.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-27.18111228942871, -26.56928825378418, -25.95746421813965, -25.345640182495117, -24.73381805419922, -24.121994018554688, -23.510169982910156, -22.898345947265625, -22.286521911621094, -21.674697875976562, -21.06287384033203, -20.4510498046875, -19.83922576904297, -19.22740364074707, -18.61557960510254, -18.003755569458008, -17.391931533813477, -16.780107498168945, -16.168283462524414, -15.5564603805542, -14.944636344909668, -14.332812309265137, -13.720989227294922, -13.10916519165039, -12.49734115600586, -11.885517120361328, -11.273693084716797, -10.661870002746582, -10.05004596710205, -9.43822193145752, -8.826398849487305, -8.214574813842773, -7.602748870849609, -6.990924835205078, -6.379101276397705, -5.767277717590332, -5.155453681945801, -4.5436296463012695, -3.9318060874938965, -3.3199825286865234, -2.708158493041992, -2.09633469581604, -1.484510898590088, -0.8726871013641357, -0.2608633041381836, 0.35096049308776855, 0.9627842903137207, 1.5746078491210938, 2.186431884765625, 2.798255681991577, 3.4100794792175293, 4.021903038024902, 4.633727073669434, 5.245551109313965, 5.857374668121338, 6.469198226928711, 7.081022262573242, 7.692846298217773, 8.304670333862305, 8.91649341583252, 9.52831745147705, 10.140141487121582, 10.751964569091797, 11.363788604736328, 11.97561264038086]}, "gradients/decoder.model.decoder.layers.8.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 6.0, 10.0, 18.0, 21.0, 34.0, 51.0, 54.0, 87.0, 105.0, 109.0, 122.0, 106.0, 106.0, 71.0, 45.0, 26.0, 16.0, 13.0, 3.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0], "bins": [-43.572532653808594, -42.681766510009766, -41.79099655151367, -40.900230407714844, -40.00946044921875, -39.11869430541992, -38.22792434692383, -37.337158203125, -36.446388244628906, -35.55562210083008, -34.664852142333984, -33.774085998535156, -32.88331604003906, -31.992549896240234, -31.101781845092773, -30.211013793945312, -29.320247650146484, -28.429479598999023, -27.538711547851562, -26.6479434967041, -25.75717544555664, -24.866409301757812, -23.97564125061035, -23.08487319946289, -22.19410514831543, -21.30333709716797, -20.412569046020508, -19.521800994873047, -18.63103485107422, -17.740264892578125, -16.849498748779297, -15.958730697631836, -15.067964553833008, -14.177196502685547, -13.286428451538086, -12.395661354064941, -11.50489330291748, -10.61412525177002, -9.723358154296875, -8.832590103149414, -7.941822052001953, -7.051054000854492, -6.1602864265441895, -5.269518852233887, -4.378750801086426, -3.487982749938965, -2.597215175628662, -1.7064476013183594, -0.8156795501708984, 0.0750882625579834, 0.9658560752868652, 1.856623888015747, 2.747391700744629, 3.63815975189209, 4.528927326202393, 5.419694900512695, 6.310462951660156, 7.201231002807617, 8.091999053955078, 8.982766151428223, 9.873534202575684, 10.764302253723145, 11.655069351196289, 12.54583740234375, 13.436605453491211]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 4.0, 8.0, 14.0, 21.0, 32.0, 55.0, 117.0, 207.0, 483.0, 1089.0, 3062.0, 9104.0, 32723.0, 122807.0, 383161.0, 349319.0, 105529.0, 28352.0, 8060.0, 2602.0, 965.0, 395.0, 190.0, 109.0, 62.0, 30.0, 25.0, 17.0, 9.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3125, -11.8870849609375, -11.461669921875, -11.0362548828125, -10.61083984375, -10.1854248046875, -9.760009765625, -9.3345947265625, -8.9091796875, -8.4837646484375, -8.058349609375, -7.6329345703125, -7.20751953125, -6.7821044921875, -6.356689453125, -5.9312744140625, -5.505859375, -5.0804443359375, -4.655029296875, -4.2296142578125, -3.80419921875, -3.3787841796875, -2.953369140625, -2.5279541015625, -2.1025390625, -1.6771240234375, -1.251708984375, -0.8262939453125, -0.40087890625, 0.0245361328125, 0.449951171875, 0.8753662109375, 1.30078125, 1.7261962890625, 2.151611328125, 2.5770263671875, 3.00244140625, 3.4278564453125, 3.853271484375, 4.2786865234375, 4.7041015625, 5.1295166015625, 5.554931640625, 5.9803466796875, 6.40576171875, 6.8311767578125, 7.256591796875, 7.6820068359375, 8.107421875, 8.5328369140625, 8.958251953125, 9.3836669921875, 9.80908203125, 10.2344970703125, 10.659912109375, 11.0853271484375, 11.5107421875, 11.9361572265625, 12.361572265625, 12.7869873046875, 13.21240234375, 13.6378173828125, 14.063232421875, 14.4886474609375, 14.9140625]}, "gradients/decoder.model.decoder.layers.8.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 7.0, 6.0, 4.0, 11.0, 19.0, 8.0, 31.0, 35.0, 33.0, 56.0, 76.0, 67.0, 90.0, 87.0, 82.0, 80.0, 77.0, 66.0, 50.0, 46.0, 30.0, 13.0, 15.0, 12.0, 1.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0], "bins": [-55.9375, -54.737548828125, -53.53759765625, -52.337646484375, -51.1376953125, -49.937744140625, -48.73779296875, -47.537841796875, -46.337890625, -45.137939453125, -43.93798828125, -42.738037109375, -41.5380859375, -40.338134765625, -39.13818359375, -37.938232421875, -36.73828125, -35.538330078125, -34.33837890625, -33.138427734375, -31.9384765625, -30.738525390625, -29.53857421875, -28.338623046875, -27.138671875, -25.938720703125, -24.73876953125, -23.538818359375, -22.3388671875, -21.138916015625, -19.93896484375, -18.739013671875, -17.5390625, -16.339111328125, -15.13916015625, -13.939208984375, -12.7392578125, -11.539306640625, -10.33935546875, -9.139404296875, -7.939453125, -6.739501953125, -5.53955078125, -4.339599609375, -3.1396484375, -1.939697265625, -0.73974609375, 0.460205078125, 1.66015625, 2.860107421875, 4.06005859375, 5.260009765625, 6.4599609375, 7.659912109375, 8.85986328125, 10.059814453125, 11.259765625, 12.459716796875, 13.65966796875, 14.859619140625, 16.0595703125, 17.259521484375, 18.45947265625, 19.659423828125, 20.859375]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 6.0, 7.0, 12.0, 10.0, 17.0, 16.0, 13.0, 21.0, 23.0, 17.0, 26.0, 35.0, 57.0, 61.0, 108.0, 221.0, 613.0, 19994.0, 1008067.0, 17960.0, 569.0, 206.0, 126.0, 71.0, 47.0, 32.0, 35.0, 28.0, 24.0, 24.0, 15.0, 19.0, 12.0, 6.0, 11.0, 11.0, 10.0, 7.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.4375, -60.3203125, -58.203125, -56.0859375, -53.96875, -51.8515625, -49.734375, -47.6171875, -45.5, -43.3828125, -41.265625, -39.1484375, -37.03125, -34.9140625, -32.796875, -30.6796875, -28.5625, -26.4453125, -24.328125, -22.2109375, -20.09375, -17.9765625, -15.859375, -13.7421875, -11.625, -9.5078125, -7.390625, -5.2734375, -3.15625, -1.0390625, 1.078125, 3.1953125, 5.3125, 7.4296875, 9.546875, 11.6640625, 13.78125, 15.8984375, 18.015625, 20.1328125, 22.25, 24.3671875, 26.484375, 28.6015625, 30.71875, 32.8359375, 34.953125, 37.0703125, 39.1875, 41.3046875, 43.421875, 45.5390625, 47.65625, 49.7734375, 51.890625, 54.0078125, 56.125, 58.2421875, 60.359375, 62.4765625, 64.59375, 66.7109375, 68.828125, 70.9453125, 73.0625]}, "gradients/decoder.model.decoder.layers.8.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 3.0, 7.0, 6.0, 1.0, 4.0, 10.0, 9.0, 10.0, 16.0, 16.0, 23.0, 20.0, 19.0, 23.0, 30.0, 46.0, 35.0, 35.0, 42.0, 45.0, 46.0, 49.0, 46.0, 47.0, 63.0, 32.0, 35.0, 36.0, 35.0, 40.0, 30.0, 25.0, 22.0, 19.0, 15.0, 15.0, 11.0, 7.0, 10.0, 9.0, 10.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.703125, -22.958251953125, -22.21337890625, -21.468505859375, -20.7236328125, -19.978759765625, -19.23388671875, -18.489013671875, -17.744140625, -16.999267578125, -16.25439453125, -15.509521484375, -14.7646484375, -14.019775390625, -13.27490234375, -12.530029296875, -11.78515625, -11.040283203125, -10.29541015625, -9.550537109375, -8.8056640625, -8.060791015625, -7.31591796875, -6.571044921875, -5.826171875, -5.081298828125, -4.33642578125, -3.591552734375, -2.8466796875, -2.101806640625, -1.35693359375, -0.612060546875, 0.1328125, 0.877685546875, 1.62255859375, 2.367431640625, 3.1123046875, 3.857177734375, 4.60205078125, 5.346923828125, 6.091796875, 6.836669921875, 7.58154296875, 8.326416015625, 9.0712890625, 9.816162109375, 10.56103515625, 11.305908203125, 12.05078125, 12.795654296875, 13.54052734375, 14.285400390625, 15.0302734375, 15.775146484375, 16.52001953125, 17.264892578125, 18.009765625, 18.754638671875, 19.49951171875, 20.244384765625, 20.9892578125, 21.734130859375, 22.47900390625, 23.223876953125, 23.96875]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 5.0, 6.0, 17.0, 10.0, 23.0, 53.0, 162.0, 508.0, 2264.0, 22647.0, 921839.0, 95651.0, 4161.0, 757.0, 243.0, 94.0, 39.0, 20.0, 19.0, 8.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.7109375, -15.2442626953125, -14.777587890625, -14.3109130859375, -13.84423828125, -13.3775634765625, -12.910888671875, -12.4442138671875, -11.9775390625, -11.5108642578125, -11.044189453125, -10.5775146484375, -10.11083984375, -9.6441650390625, -9.177490234375, -8.7108154296875, -8.244140625, -7.7774658203125, -7.310791015625, -6.8441162109375, -6.37744140625, -5.9107666015625, -5.444091796875, -4.9774169921875, -4.5107421875, -4.0440673828125, -3.577392578125, -3.1107177734375, -2.64404296875, -2.1773681640625, -1.710693359375, -1.2440185546875, -0.77734375, -0.3106689453125, 0.156005859375, 0.6226806640625, 1.08935546875, 1.5560302734375, 2.022705078125, 2.4893798828125, 2.9560546875, 3.4227294921875, 3.889404296875, 4.3560791015625, 4.82275390625, 5.2894287109375, 5.756103515625, 6.2227783203125, 6.689453125, 7.1561279296875, 7.622802734375, 8.0894775390625, 8.55615234375, 9.0228271484375, 9.489501953125, 9.9561767578125, 10.4228515625, 10.8895263671875, 11.356201171875, 11.8228759765625, 12.28955078125, 12.7562255859375, 13.222900390625, 13.6895751953125, 14.15625]}, "gradients/decoder.model.decoder.layers.8.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 6.0, 7.0, 10.0, 14.0, 27.0, 32.0, 30.0, 49.0, 75.0, 79.0, 83.0, 101.0, 109.0, 87.0, 77.0, 49.0, 40.0, 35.0, 27.0, 20.0, 9.0, 11.0, 5.0, 8.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007228851318359375, -0.0006978586316108704, -0.0006728321313858032, -0.0006478056311607361, -0.0006227791309356689, -0.0005977526307106018, -0.0005727261304855347, -0.0005476996302604675, -0.0005226731300354004, -0.0004976466298103333, -0.0004726201295852661, -0.000447593629360199, -0.00042256712913513184, -0.0003975406289100647, -0.00037251412868499756, -0.0003474876284599304, -0.0003224611282348633, -0.00029743462800979614, -0.000272408127784729, -0.00024738162755966187, -0.00022235512733459473, -0.0001973286271095276, -0.00017230212688446045, -0.0001472756266593933, -0.00012224912643432617, -9.722262620925903e-05, -7.21961259841919e-05, -4.7169625759124756e-05, -2.2143125534057617e-05, 2.8833746910095215e-06, 2.790987491607666e-05, 5.29363751411438e-05, 7.796287536621094e-05, 0.00010298937559127808, 0.00012801587581634521, 0.00015304237604141235, 0.0001780688762664795, 0.00020309537649154663, 0.00022812187671661377, 0.0002531483769416809, 0.00027817487716674805, 0.0003032013773918152, 0.0003282278776168823, 0.00035325437784194946, 0.0003782808780670166, 0.00040330737829208374, 0.0004283338785171509, 0.000453360378742218, 0.00047838687896728516, 0.0005034133791923523, 0.0005284398794174194, 0.0005534663796424866, 0.0005784928798675537, 0.0006035193800926208, 0.000628545880317688, 0.0006535723805427551, 0.0006785988807678223, 0.0007036253809928894, 0.0007286518812179565, 0.0007536783814430237, 0.0007787048816680908, 0.000803731381893158, 0.0008287578821182251, 0.0008537843823432922, 0.0008788108825683594]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 8.0, 9.0, 20.0, 31.0, 43.0, 93.0, 145.0, 359.0, 1376.0, 8744.0, 201677.0, 790879.0, 40203.0, 3556.0, 836.0, 269.0, 122.0, 63.0, 31.0, 21.0, 19.0, 11.0, 5.0, 5.0, 3.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.921875, -10.58349609375, -10.2451171875, -9.90673828125, -9.568359375, -9.22998046875, -8.8916015625, -8.55322265625, -8.21484375, -7.87646484375, -7.5380859375, -7.19970703125, -6.861328125, -6.52294921875, -6.1845703125, -5.84619140625, -5.5078125, -5.16943359375, -4.8310546875, -4.49267578125, -4.154296875, -3.81591796875, -3.4775390625, -3.13916015625, -2.80078125, -2.46240234375, -2.1240234375, -1.78564453125, -1.447265625, -1.10888671875, -0.7705078125, -0.43212890625, -0.09375, 0.24462890625, 0.5830078125, 0.92138671875, 1.259765625, 1.59814453125, 1.9365234375, 2.27490234375, 2.61328125, 2.95166015625, 3.2900390625, 3.62841796875, 3.966796875, 4.30517578125, 4.6435546875, 4.98193359375, 5.3203125, 5.65869140625, 5.9970703125, 6.33544921875, 6.673828125, 7.01220703125, 7.3505859375, 7.68896484375, 8.02734375, 8.36572265625, 8.7041015625, 9.04248046875, 9.380859375, 9.71923828125, 10.0576171875, 10.39599609375, 10.734375]}, "gradients/decoder.model.decoder.layers.8.self_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 6.0, 3.0, 5.0, 11.0, 10.0, 22.0, 23.0, 32.0, 57.0, 58.0, 79.0, 109.0, 109.0, 100.0, 83.0, 75.0, 65.0, 52.0, 29.0, 18.0, 22.0, 12.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.802734375, -1.720458984375, -1.63818359375, -1.555908203125, -1.4736328125, -1.391357421875, -1.30908203125, -1.226806640625, -1.14453125, -1.062255859375, -0.97998046875, -0.897705078125, -0.8154296875, -0.733154296875, -0.65087890625, -0.568603515625, -0.486328125, -0.404052734375, -0.32177734375, -0.239501953125, -0.1572265625, -0.074951171875, 0.00732421875, 0.089599609375, 0.171875, 0.254150390625, 0.33642578125, 0.418701171875, 0.5009765625, 0.583251953125, 0.66552734375, 0.747802734375, 0.830078125, 0.912353515625, 0.99462890625, 1.076904296875, 1.1591796875, 1.241455078125, 1.32373046875, 1.406005859375, 1.48828125, 1.570556640625, 1.65283203125, 1.735107421875, 1.8173828125, 1.899658203125, 1.98193359375, 2.064208984375, 2.146484375, 2.228759765625, 2.31103515625, 2.393310546875, 2.4755859375, 2.557861328125, 2.64013671875, 2.722412109375, 2.8046875, 2.886962890625, 2.96923828125, 3.051513671875, 3.1337890625, 3.216064453125, 3.29833984375, 3.380615234375, 3.462890625]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 8.0, 16.0, 34.0, 68.0, 129.0, 205.0, 216.0, 156.0, 88.0, 48.0, 22.0, 4.0, 6.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-92.15776062011719, -89.96730041503906, -87.7768325805664, -85.58636474609375, -83.39590454101562, -81.2054443359375, -79.01497650146484, -76.82450866699219, -74.63404846191406, -72.44358825683594, -70.25312042236328, -68.06265258789062, -65.8721923828125, -63.68172836303711, -61.49126434326172, -59.30080032348633, -57.11033630371094, -54.91987228393555, -52.729408264160156, -50.538944244384766, -48.348480224609375, -46.158016204833984, -43.967552185058594, -41.7770881652832, -39.58662414550781, -37.39616012573242, -35.20569610595703, -33.01523208618164, -30.82476806640625, -28.63430404663086, -26.44384002685547, -24.253376007080078, -22.06291961669922, -19.872455596923828, -17.681991577148438, -15.491527557373047, -13.301063537597656, -11.110599517822266, -8.920135498046875, -6.729671478271484, -4.539207458496094, -2.348743438720703, -0.1582794189453125, 2.032184600830078, 4.222648620605469, 6.413112640380859, 8.60357666015625, 10.79404067993164, 12.984504699707031, 15.174968719482422, 17.365432739257812, 19.555896759033203, 21.746360778808594, 23.936824798583984, 26.127288818359375, 28.317752838134766, 30.508216857910156, 32.69868087768555, 34.88914489746094, 37.07960891723633, 39.27007293701172, 41.46053695678711, 43.6510009765625, 45.84146499633789, 48.03192901611328]}, "gradients/decoder.model.decoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 4.0, 13.0, 16.0, 10.0, 21.0, 16.0, 34.0, 38.0, 48.0, 57.0, 61.0, 68.0, 53.0, 63.0, 66.0, 61.0, 61.0, 62.0, 61.0, 35.0, 37.0, 31.0, 30.0, 18.0, 16.0, 12.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-70.88099670410156, -69.05985260009766, -67.23870086669922, -65.41755676269531, -63.596405029296875, -61.77526092529297, -59.9541130065918, -58.132965087890625, -56.31181716918945, -54.49066925048828, -52.66952133178711, -50.84837341308594, -49.02722930908203, -47.206077575683594, -45.38493347167969, -43.563785552978516, -41.742637634277344, -39.92148971557617, -38.100341796875, -36.27919387817383, -34.458045959472656, -32.63690185546875, -30.815753936767578, -28.994606018066406, -27.173458099365234, -25.352310180664062, -23.53116226196289, -21.71001625061035, -19.88886833190918, -18.067720413208008, -16.24657440185547, -14.425426483154297, -12.604278564453125, -10.783130645751953, -8.961983680725098, -7.140836238861084, -5.31968879699707, -3.4985408782958984, -1.677393913269043, 0.1437530517578125, 1.9649009704589844, 3.786048412322998, 5.607195854187012, 7.428343296051025, 9.249490737915039, 11.070638656616211, 12.891785621643066, 14.712932586669922, 16.534080505371094, 18.355228424072266, 20.176376342773438, 21.997522354125977, 23.81867027282715, 25.63981819152832, 27.46096420288086, 29.28211212158203, 31.103260040283203, 32.924407958984375, 34.74555587768555, 36.56670379638672, 38.387847900390625, 40.20899963378906, 42.03014373779297, 43.85129165649414, 45.67243957519531]}, "gradients/decoder.model.decoder.layers.7.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 10.0, 7.0, 19.0, 24.0, 42.0, 49.0, 65.0, 90.0, 120.0, 180.0, 275.0, 517.0, 1106.0, 4614.0, 35615.0, 442304.0, 2556358.0, 1046289.0, 91679.0, 9960.0, 2872.0, 1079.0, 392.0, 187.0, 119.0, 82.0, 63.0, 48.0, 29.0, 18.0, 17.0, 12.0, 8.0, 12.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.875, -31.006103515625, -30.13720703125, -29.268310546875, -28.3994140625, -27.530517578125, -26.66162109375, -25.792724609375, -24.923828125, -24.054931640625, -23.18603515625, -22.317138671875, -21.4482421875, -20.579345703125, -19.71044921875, -18.841552734375, -17.97265625, -17.103759765625, -16.23486328125, -15.365966796875, -14.4970703125, -13.628173828125, -12.75927734375, -11.890380859375, -11.021484375, -10.152587890625, -9.28369140625, -8.414794921875, -7.5458984375, -6.677001953125, -5.80810546875, -4.939208984375, -4.0703125, -3.201416015625, -2.33251953125, -1.463623046875, -0.5947265625, 0.274169921875, 1.14306640625, 2.011962890625, 2.880859375, 3.749755859375, 4.61865234375, 5.487548828125, 6.3564453125, 7.225341796875, 8.09423828125, 8.963134765625, 9.83203125, 10.700927734375, 11.56982421875, 12.438720703125, 13.3076171875, 14.176513671875, 15.04541015625, 15.914306640625, 16.783203125, 17.652099609375, 18.52099609375, 19.389892578125, 20.2587890625, 21.127685546875, 21.99658203125, 22.865478515625, 23.734375]}, "gradients/decoder.model.decoder.layers.7.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 9.0, 16.0, 21.0, 21.0, 18.0, 40.0, 39.0, 58.0, 63.0, 75.0, 80.0, 86.0, 79.0, 81.0, 76.0, 65.0, 58.0, 46.0, 24.0, 19.0, 8.0, 5.0, 5.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-38.5, -37.634765625, -36.76953125, -35.904296875, -35.0390625, -34.173828125, -33.30859375, -32.443359375, -31.578125, -30.712890625, -29.84765625, -28.982421875, -28.1171875, -27.251953125, -26.38671875, -25.521484375, -24.65625, -23.791015625, -22.92578125, -22.060546875, -21.1953125, -20.330078125, -19.46484375, -18.599609375, -17.734375, -16.869140625, -16.00390625, -15.138671875, -14.2734375, -13.408203125, -12.54296875, -11.677734375, -10.8125, -9.947265625, -9.08203125, -8.216796875, -7.3515625, -6.486328125, -5.62109375, -4.755859375, -3.890625, -3.025390625, -2.16015625, -1.294921875, -0.4296875, 0.435546875, 1.30078125, 2.166015625, 3.03125, 3.896484375, 4.76171875, 5.626953125, 6.4921875, 7.357421875, 8.22265625, 9.087890625, 9.953125, 10.818359375, 11.68359375, 12.548828125, 13.4140625, 14.279296875, 15.14453125, 16.009765625, 16.875]}, "gradients/decoder.model.decoder.layers.7.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 13.0, 11.0, 18.0, 28.0, 44.0, 81.0, 141.0, 418.0, 1870.0, 61622.0, 4059132.0, 68268.0, 1857.0, 408.0, 167.0, 82.0, 59.0, 21.0, 21.0, 10.0, 9.0, 0.0, 5.0, 1.0, 2.0, 0.0, 1.0], "bins": [-89.3125, -87.4326171875, -85.552734375, -83.6728515625, -81.79296875, -79.9130859375, -78.033203125, -76.1533203125, -74.2734375, -72.3935546875, -70.513671875, -68.6337890625, -66.75390625, -64.8740234375, -62.994140625, -61.1142578125, -59.234375, -57.3544921875, -55.474609375, -53.5947265625, -51.71484375, -49.8349609375, -47.955078125, -46.0751953125, -44.1953125, -42.3154296875, -40.435546875, -38.5556640625, -36.67578125, -34.7958984375, -32.916015625, -31.0361328125, -29.15625, -27.2763671875, -25.396484375, -23.5166015625, -21.63671875, -19.7568359375, -17.876953125, -15.9970703125, -14.1171875, -12.2373046875, -10.357421875, -8.4775390625, -6.59765625, -4.7177734375, -2.837890625, -0.9580078125, 0.921875, 2.8017578125, 4.681640625, 6.5615234375, 8.44140625, 10.3212890625, 12.201171875, 14.0810546875, 15.9609375, 17.8408203125, 19.720703125, 21.6005859375, 23.48046875, 25.3603515625, 27.240234375, 29.1201171875, 31.0]}, "gradients/decoder.model.decoder.layers.7.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 1.0, 3.0, 1.0, 3.0, 6.0, 4.0, 13.0, 14.0, 22.0, 33.0, 33.0, 63.0, 84.0, 133.0, 177.0, 231.0, 358.0, 426.0, 503.0, 523.0, 441.0, 304.0, 223.0, 137.0, 118.0, 67.0, 51.0, 24.0, 16.0, 19.0, 19.0, 10.0, 4.0, 2.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.62890625, -4.42596435546875, -4.2230224609375, -4.02008056640625, -3.817138671875, -3.61419677734375, -3.4112548828125, -3.20831298828125, -3.00537109375, -2.80242919921875, -2.5994873046875, -2.39654541015625, -2.193603515625, -1.99066162109375, -1.7877197265625, -1.58477783203125, -1.3818359375, -1.17889404296875, -0.9759521484375, -0.77301025390625, -0.570068359375, -0.36712646484375, -0.1641845703125, 0.03875732421875, 0.24169921875, 0.44464111328125, 0.6475830078125, 0.85052490234375, 1.053466796875, 1.25640869140625, 1.4593505859375, 1.66229248046875, 1.865234375, 2.06817626953125, 2.2711181640625, 2.47406005859375, 2.677001953125, 2.87994384765625, 3.0828857421875, 3.28582763671875, 3.48876953125, 3.69171142578125, 3.8946533203125, 4.09759521484375, 4.300537109375, 4.50347900390625, 4.7064208984375, 4.90936279296875, 5.1123046875, 5.31524658203125, 5.5181884765625, 5.72113037109375, 5.924072265625, 6.12701416015625, 6.3299560546875, 6.53289794921875, 6.73583984375, 6.93878173828125, 7.1417236328125, 7.34466552734375, 7.547607421875, 7.75054931640625, 7.9534912109375, 8.15643310546875, 8.359375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 10.0, 32.0, 26.0, 38.0, 39.0, 59.0, 73.0, 62.0, 89.0, 80.0, 94.0, 92.0, 70.0, 68.0, 52.0, 36.0, 21.0, 11.0, 20.0, 6.0, 5.0, 3.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.05757522583008, -32.29737091064453, -31.537168502807617, -30.776966094970703, -30.01676368713379, -29.256561279296875, -28.496356964111328, -27.736154556274414, -26.9759521484375, -26.215749740600586, -25.45554542541504, -24.695343017578125, -23.93514060974121, -23.174938201904297, -22.41473388671875, -21.654531478881836, -20.89432716369629, -20.134124755859375, -19.373920440673828, -18.613718032836914, -17.853515625, -17.093311309814453, -16.33310890197754, -15.572906494140625, -14.812703132629395, -14.052499771118164, -13.29229736328125, -12.53209400177002, -11.771890640258789, -11.011688232421875, -10.251484870910645, -9.491281509399414, -8.7310791015625, -7.970876216888428, -7.2106733322143555, -6.450469970703125, -5.690267086029053, -4.9300642013549805, -4.16986083984375, -3.4096579551696777, -2.6494550704956055, -1.8892520666122437, -1.1290490627288818, -0.36884593963623047, 0.3913569450378418, 1.151559829711914, 1.9117631912231445, 2.671966075897217, 3.432168960571289, 4.192371845245361, 4.952574729919434, 5.712778091430664, 6.472980976104736, 7.233183860778809, 7.993387222290039, 8.753589630126953, 9.513792991638184, 10.273996353149414, 11.034198760986328, 11.794402122497559, 12.554605484008789, 13.314807891845703, 14.075011253356934, 14.835214614868164, 15.595417022705078]}, "gradients/decoder.model.decoder.layers.7.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 8.0, 16.0, 12.0, 15.0, 23.0, 34.0, 27.0, 46.0, 55.0, 65.0, 59.0, 63.0, 76.0, 76.0, 76.0, 80.0, 67.0, 56.0, 41.0, 32.0, 29.0, 19.0, 14.0, 4.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-39.191429138183594, -38.29949951171875, -37.40757369995117, -36.51564407348633, -35.623714447021484, -34.731788635253906, -33.83985900878906, -32.94792938232422, -32.055999755859375, -31.164072036743164, -30.27214241027832, -29.38021469116211, -28.488285064697266, -27.596357345581055, -26.704429626464844, -25.8125, -24.920574188232422, -24.02864646911621, -23.136716842651367, -22.244789123535156, -21.352859497070312, -20.4609317779541, -19.56900405883789, -18.677074432373047, -17.785144805908203, -16.893217086791992, -16.00128746032715, -15.109359741210938, -14.21743106842041, -13.325502395629883, -12.433573722839355, -11.541645050048828, -10.649717330932617, -9.75778865814209, -8.865859985351562, -7.973931789398193, -7.082003593444824, -6.190074920654297, -5.2981462478637695, -4.4062180519104, -3.514289379119873, -2.622360944747925, -1.730432391166687, -0.8385038375854492, 0.05342459678649902, 0.9453530311584473, 1.8372817039489746, 2.7292098999023438, 3.621138572692871, 4.513067245483398, 5.404995441436768, 6.296924114227295, 7.188852310180664, 8.080780982971191, 8.972709655761719, 9.86463737487793, 10.756567001342773, 11.6484956741333, 12.540424346923828, 13.432352066040039, 14.324280738830566, 15.216209411621094, 16.108139038085938, 17.00006675720215, 17.89199447631836]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 4.0, 5.0, 13.0, 19.0, 22.0, 35.0, 58.0, 101.0, 166.0, 358.0, 1172.0, 8866.0, 162569.0, 803421.0, 65668.0, 4666.0, 777.0, 294.0, 144.0, 86.0, 46.0, 27.0, 11.0, 16.0, 6.0, 4.0, 2.0, 0.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8125, -8.531494140625, -8.25048828125, -7.969482421875, -7.6884765625, -7.407470703125, -7.12646484375, -6.845458984375, -6.564453125, -6.283447265625, -6.00244140625, -5.721435546875, -5.4404296875, -5.159423828125, -4.87841796875, -4.597412109375, -4.31640625, -4.035400390625, -3.75439453125, -3.473388671875, -3.1923828125, -2.911376953125, -2.63037109375, -2.349365234375, -2.068359375, -1.787353515625, -1.50634765625, -1.225341796875, -0.9443359375, -0.663330078125, -0.38232421875, -0.101318359375, 0.1796875, 0.460693359375, 0.74169921875, 1.022705078125, 1.3037109375, 1.584716796875, 1.86572265625, 2.146728515625, 2.427734375, 2.708740234375, 2.98974609375, 3.270751953125, 3.5517578125, 3.832763671875, 4.11376953125, 4.394775390625, 4.67578125, 4.956787109375, 5.23779296875, 5.518798828125, 5.7998046875, 6.080810546875, 6.36181640625, 6.642822265625, 6.923828125, 7.204833984375, 7.48583984375, 7.766845703125, 8.0478515625, 8.328857421875, 8.60986328125, 8.890869140625, 9.171875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 9.0, 26.0, 39.0, 62.0, 80.0, 111.0, 136.0, 147.0, 163.0, 96.0, 65.0, 42.0, 10.0, 12.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.515625, -27.421142578125, -26.32666015625, -25.232177734375, -24.1376953125, -23.043212890625, -21.94873046875, -20.854248046875, -19.759765625, -18.665283203125, -17.57080078125, -16.476318359375, -15.3818359375, -14.287353515625, -13.19287109375, -12.098388671875, -11.00390625, -9.909423828125, -8.81494140625, -7.720458984375, -6.6259765625, -5.531494140625, -4.43701171875, -3.342529296875, -2.248046875, -1.153564453125, -0.05908203125, 1.035400390625, 2.1298828125, 3.224365234375, 4.31884765625, 5.413330078125, 6.5078125, 7.602294921875, 8.69677734375, 9.791259765625, 10.8857421875, 11.980224609375, 13.07470703125, 14.169189453125, 15.263671875, 16.358154296875, 17.45263671875, 18.547119140625, 19.6416015625, 20.736083984375, 21.83056640625, 22.925048828125, 24.01953125, 25.114013671875, 26.20849609375, 27.302978515625, 28.3974609375, 29.491943359375, 30.58642578125, 31.680908203125, 32.775390625, 33.869873046875, 34.96435546875, 36.058837890625, 37.1533203125, 38.247802734375, 39.34228515625, 40.436767578125, 41.53125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 1.0, 5.0, 6.0, 3.0, 16.0, 15.0, 31.0, 46.0, 64.0, 122.0, 207.0, 290.0, 652.0, 1133.0, 2172.0, 4372.0, 9124.0, 19155.0, 42067.0, 91359.0, 181926.0, 265962.0, 214577.0, 114305.0, 53748.0, 24562.0, 11378.0, 5501.0, 2596.0, 1422.0, 773.0, 421.0, 215.0, 134.0, 73.0, 44.0, 26.0, 27.0, 10.0, 8.0, 8.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.40234375, -1.347686767578125, -1.29302978515625, -1.238372802734375, -1.1837158203125, -1.129058837890625, -1.07440185546875, -1.019744873046875, -0.965087890625, -0.910430908203125, -0.85577392578125, -0.801116943359375, -0.7464599609375, -0.691802978515625, -0.63714599609375, -0.582489013671875, -0.52783203125, -0.473175048828125, -0.41851806640625, -0.363861083984375, -0.3092041015625, -0.254547119140625, -0.19989013671875, -0.145233154296875, -0.090576171875, -0.035919189453125, 0.01873779296875, 0.073394775390625, 0.1280517578125, 0.182708740234375, 0.23736572265625, 0.292022705078125, 0.3466796875, 0.401336669921875, 0.45599365234375, 0.510650634765625, 0.5653076171875, 0.619964599609375, 0.67462158203125, 0.729278564453125, 0.783935546875, 0.838592529296875, 0.89324951171875, 0.947906494140625, 1.0025634765625, 1.057220458984375, 1.11187744140625, 1.166534423828125, 1.22119140625, 1.275848388671875, 1.33050537109375, 1.385162353515625, 1.4398193359375, 1.494476318359375, 1.54913330078125, 1.603790283203125, 1.658447265625, 1.713104248046875, 1.76776123046875, 1.822418212890625, 1.8770751953125, 1.931732177734375, 1.98638916015625, 2.041046142578125, 2.095703125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 2.0, 5.0, 6.0, 7.0, 7.0, 12.0, 10.0, 13.0, 23.0, 24.0, 35.0, 44.0, 31.0, 42.0, 57.0, 64.0, 51.0, 56.0, 73.0, 63.0, 48.0, 42.0, 39.0, 50.0, 33.0, 28.0, 33.0, 21.0, 18.0, 23.0, 14.0, 9.0, 7.0, 5.0, 7.0, 0.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.640625, -22.7802734375, -21.919921875, -21.0595703125, -20.19921875, -19.3388671875, -18.478515625, -17.6181640625, -16.7578125, -15.8974609375, -15.037109375, -14.1767578125, -13.31640625, -12.4560546875, -11.595703125, -10.7353515625, -9.875, -9.0146484375, -8.154296875, -7.2939453125, -6.43359375, -5.5732421875, -4.712890625, -3.8525390625, -2.9921875, -2.1318359375, -1.271484375, -0.4111328125, 0.44921875, 1.3095703125, 2.169921875, 3.0302734375, 3.890625, 4.7509765625, 5.611328125, 6.4716796875, 7.33203125, 8.1923828125, 9.052734375, 9.9130859375, 10.7734375, 11.6337890625, 12.494140625, 13.3544921875, 14.21484375, 15.0751953125, 15.935546875, 16.7958984375, 17.65625, 18.5166015625, 19.376953125, 20.2373046875, 21.09765625, 21.9580078125, 22.818359375, 23.6787109375, 24.5390625, 25.3994140625, 26.259765625, 27.1201171875, 27.98046875, 28.8408203125, 29.701171875, 30.5615234375, 31.421875]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 2.0, 1.0, 1.0, 7.0, 6.0, 9.0, 16.0, 16.0, 33.0, 35.0, 62.0, 79.0, 131.0, 194.0, 322.0, 531.0, 935.0, 1768.0, 3513.0, 7874.0, 19857.0, 55350.0, 159286.0, 349576.0, 280678.0, 106454.0, 36884.0, 13515.0, 5431.0, 2523.0, 1333.0, 805.0, 445.0, 317.0, 185.0, 127.0, 85.0, 47.0, 36.0, 32.0, 12.0, 16.0, 7.0, 5.0, 10.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.28759765625, -0.27933502197265625, -0.2710723876953125, -0.26280975341796875, -0.254547119140625, -0.24628448486328125, -0.2380218505859375, -0.22975921630859375, -0.22149658203125, -0.21323394775390625, -0.2049713134765625, -0.19670867919921875, -0.188446044921875, -0.18018341064453125, -0.1719207763671875, -0.16365814208984375, -0.1553955078125, -0.14713287353515625, -0.1388702392578125, -0.13060760498046875, -0.122344970703125, -0.11408233642578125, -0.1058197021484375, -0.09755706787109375, -0.08929443359375, -0.08103179931640625, -0.0727691650390625, -0.06450653076171875, -0.056243896484375, -0.04798126220703125, -0.0397186279296875, -0.03145599365234375, -0.023193359375, -0.01493072509765625, -0.0066680908203125, 0.00159454345703125, 0.009857177734375, 0.01811981201171875, 0.0263824462890625, 0.03464508056640625, 0.04290771484375, 0.05117034912109375, 0.0594329833984375, 0.06769561767578125, 0.075958251953125, 0.08422088623046875, 0.0924835205078125, 0.10074615478515625, 0.1090087890625, 0.11727142333984375, 0.1255340576171875, 0.13379669189453125, 0.142059326171875, 0.15032196044921875, 0.1585845947265625, 0.16684722900390625, 0.17510986328125, 0.18337249755859375, 0.1916351318359375, 0.19989776611328125, 0.208160400390625, 0.21642303466796875, 0.2246856689453125, 0.23294830322265625, 0.2412109375]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 9.0, 9.0, 11.0, 17.0, 15.0, 22.0, 29.0, 47.0, 69.0, 81.0, 81.0, 95.0, 87.0, 107.0, 78.0, 59.0, 40.0, 42.0, 26.0, 22.0, 21.0, 11.0, 6.0, 5.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002665519714355469, -0.0002591572701931, -0.0002517625689506531, -0.0002443678677082062, -0.00023697316646575928, -0.00022957846522331238, -0.00022218376398086548, -0.00021478906273841858, -0.00020739436149597168, -0.00019999966025352478, -0.00019260495901107788, -0.00018521025776863098, -0.00017781555652618408, -0.00017042085528373718, -0.00016302615404129028, -0.00015563145279884338, -0.00014823675155639648, -0.00014084205031394958, -0.00013344734907150269, -0.00012605264782905579, -0.00011865794658660889, -0.00011126324534416199, -0.00010386854410171509, -9.647384285926819e-05, -8.907914161682129e-05, -8.168444037437439e-05, -7.428973913192749e-05, -6.689503788948059e-05, -5.950033664703369e-05, -5.210563540458679e-05, -4.471093416213989e-05, -3.731623291969299e-05, -2.9921531677246094e-05, -2.2526830434799194e-05, -1.5132129192352295e-05, -7.737427949905396e-06, -3.427267074584961e-07, 7.051974534988403e-06, 1.4446675777435303e-05, 2.1841377019882202e-05, 2.92360782623291e-05, 3.6630779504776e-05, 4.40254807472229e-05, 5.14201819896698e-05, 5.88148832321167e-05, 6.62095844745636e-05, 7.36042857170105e-05, 8.09989869594574e-05, 8.83936882019043e-05, 9.57883894443512e-05, 0.0001031830906867981, 0.000110577791929245, 0.0001179724931716919, 0.0001253671944141388, 0.0001327618956565857, 0.0001401565968990326, 0.0001475512981414795, 0.0001549459993839264, 0.0001623407006263733, 0.0001697354018688202, 0.0001771301031112671, 0.000184524804353714, 0.0001919195055961609, 0.0001993142068386078, 0.0002067089080810547]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 6.0, 7.0, 14.0, 25.0, 25.0, 33.0, 61.0, 91.0, 114.0, 283.0, 491.0, 1011.0, 2332.0, 6032.0, 18428.0, 65680.0, 241700.0, 441273.0, 195087.0, 52048.0, 15039.0, 4995.0, 1901.0, 840.0, 429.0, 233.0, 116.0, 87.0, 45.0, 33.0, 27.0, 14.0, 6.0, 14.0, 13.0, 2.0, 2.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.298583984375, -0.2890777587890625, -0.279571533203125, -0.2700653076171875, -0.26055908203125, -0.2510528564453125, -0.241546630859375, -0.2320404052734375, -0.2225341796875, -0.2130279541015625, -0.203521728515625, -0.1940155029296875, -0.18450927734375, -0.1750030517578125, -0.165496826171875, -0.1559906005859375, -0.146484375, -0.1369781494140625, -0.127471923828125, -0.1179656982421875, -0.10845947265625, -0.0989532470703125, -0.089447021484375, -0.0799407958984375, -0.0704345703125, -0.0609283447265625, -0.051422119140625, -0.0419158935546875, -0.03240966796875, -0.0229034423828125, -0.013397216796875, -0.0038909912109375, 0.005615234375, 0.0151214599609375, 0.024627685546875, 0.0341339111328125, 0.04364013671875, 0.0531463623046875, 0.062652587890625, 0.0721588134765625, 0.0816650390625, 0.0911712646484375, 0.100677490234375, 0.1101837158203125, 0.11968994140625, 0.1291961669921875, 0.138702392578125, 0.1482086181640625, 0.15771484375, 0.1672210693359375, 0.176727294921875, 0.1862335205078125, 0.19573974609375, 0.2052459716796875, 0.214752197265625, 0.2242584228515625, 0.2337646484375, 0.2432708740234375, 0.252777099609375, 0.2622833251953125, 0.27178955078125, 0.2812957763671875, 0.290802001953125, 0.3003082275390625, 0.309814453125]}, "gradients/decoder.model.decoder.layers.7.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 6.0, 9.0, 14.0, 7.0, 12.0, 19.0, 23.0, 25.0, 33.0, 42.0, 62.0, 64.0, 63.0, 70.0, 70.0, 76.0, 61.0, 50.0, 54.0, 51.0, 37.0, 21.0, 19.0, 27.0, 14.0, 12.0, 9.0, 11.0, 6.0, 3.0, 5.0, 4.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08709716796875, -0.08430957794189453, -0.08152198791503906, -0.0787343978881836, -0.07594680786132812, -0.07315921783447266, -0.07037162780761719, -0.06758403778076172, -0.06479644775390625, -0.06200885772705078, -0.05922126770019531, -0.056433677673339844, -0.053646087646484375, -0.050858497619628906, -0.04807090759277344, -0.04528331756591797, -0.0424957275390625, -0.03970813751220703, -0.03692054748535156, -0.034132957458496094, -0.031345367431640625, -0.028557777404785156, -0.025770187377929688, -0.02298259735107422, -0.02019500732421875, -0.01740741729736328, -0.014619827270507812, -0.011832237243652344, -0.009044647216796875, -0.006257057189941406, -0.0034694671630859375, -0.0006818771362304688, 0.002105712890625, 0.004893302917480469, 0.0076808929443359375, 0.010468482971191406, 0.013256072998046875, 0.016043663024902344, 0.018831253051757812, 0.02161884307861328, 0.02440643310546875, 0.02719402313232422, 0.029981613159179688, 0.032769203186035156, 0.035556793212890625, 0.038344383239746094, 0.04113197326660156, 0.04391956329345703, 0.0467071533203125, 0.04949474334716797, 0.05228233337402344, 0.055069923400878906, 0.057857513427734375, 0.060645103454589844, 0.06343269348144531, 0.06622028350830078, 0.06900787353515625, 0.07179546356201172, 0.07458305358886719, 0.07737064361572266, 0.08015823364257812, 0.0829458236694336, 0.08573341369628906, 0.08852100372314453, 0.09130859375]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 16.0, 28.0, 59.0, 103.0, 166.0, 187.0, 190.0, 136.0, 62.0, 30.0, 12.0, 5.0, 4.0, 2.0, 2.0, 1.0], "bins": [-52.15959930419922, -51.184383392333984, -50.20916748046875, -49.233951568603516, -48.25873565673828, -47.28351593017578, -46.30830383300781, -45.33308410644531, -44.35786819458008, -43.382652282714844, -42.40743637084961, -41.432220458984375, -40.45700454711914, -39.481788635253906, -38.506568908691406, -37.53135299682617, -36.55613708496094, -35.5809211730957, -34.60570526123047, -33.630489349365234, -32.6552734375, -31.680055618286133, -30.7048397064209, -29.729623794555664, -28.754409790039062, -27.779193878173828, -26.803977966308594, -25.82876205444336, -24.853544235229492, -23.878328323364258, -22.903112411499023, -21.92789649963379, -20.95267677307129, -19.977460861206055, -19.00224494934082, -18.027027130126953, -17.05181121826172, -16.076595306396484, -15.10137939453125, -14.126163482666016, -13.150946617126465, -12.17573070526123, -11.20051383972168, -10.225297927856445, -9.250082015991211, -8.27486515045166, -7.299649238586426, -6.324432849884033, -5.349216461181641, -4.374000072479248, -3.3987839221954346, -2.423567771911621, -1.4483513832092285, -0.47313499450683594, 0.5020809173583984, 1.477297306060791, 2.4525136947631836, 3.427730083465576, 4.402946472167969, 5.378162384033203, 6.353378772735596, 7.328595161437988, 8.303811073303223, 9.279027938842773, 10.254243850708008]}, "gradients/decoder.model.decoder.layers.7.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 7.0, 12.0, 17.0, 15.0, 21.0, 29.0, 29.0, 53.0, 52.0, 71.0, 73.0, 76.0, 91.0, 86.0, 95.0, 76.0, 57.0, 38.0, 35.0, 31.0, 18.0, 6.0, 10.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-28.47494125366211, -27.84413719177246, -27.213335037231445, -26.582530975341797, -25.95172691345215, -25.320924758911133, -24.690120697021484, -24.05931854248047, -23.42851448059082, -22.797710418701172, -22.166908264160156, -21.536104202270508, -20.90530014038086, -20.274497985839844, -19.643693923950195, -19.012889862060547, -18.38208770751953, -17.751283645629883, -17.120481491088867, -16.48967742919922, -15.858874320983887, -15.228071212768555, -14.597267150878906, -13.966464042663574, -13.33565902709961, -12.704855918884277, -12.074051856994629, -11.443248748779297, -10.812445640563965, -10.181642532348633, -9.550838470458984, -8.920035362243652, -8.28923225402832, -7.65842866897583, -7.027625560760498, -6.396821975708008, -5.766018867492676, -5.1352152824401855, -4.504411697387695, -3.8736085891723633, -3.242805004119873, -2.612001657485962, -1.9811981916427612, -1.3503947257995605, -0.7195913791656494, -0.08878803253173828, 0.542015552520752, 1.172818660736084, 1.8036222457885742, 2.4344255924224854, 3.0652289390563965, 3.6960325241088867, 4.326835632324219, 4.957639217376709, 5.588442802429199, 6.219245910644531, 6.8500494956970215, 7.480853080749512, 8.111656188964844, 8.742460250854492, 9.373263359069824, 10.004066467285156, 10.634870529174805, 11.26567268371582, 11.896476745605469]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 8.0, 4.0, 11.0, 6.0, 11.0, 8.0, 21.0, 24.0, 32.0, 27.0, 44.0, 55.0, 137.0, 335.0, 1341.0, 8924.0, 85326.0, 596166.0, 318457.0, 32475.0, 3808.0, 749.0, 209.0, 98.0, 73.0, 35.0, 30.0, 25.0, 24.0, 18.0, 18.0, 12.0, 6.0, 8.0, 7.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.09375, -22.318603515625, -21.54345703125, -20.768310546875, -19.9931640625, -19.218017578125, -18.44287109375, -17.667724609375, -16.892578125, -16.117431640625, -15.34228515625, -14.567138671875, -13.7919921875, -13.016845703125, -12.24169921875, -11.466552734375, -10.69140625, -9.916259765625, -9.14111328125, -8.365966796875, -7.5908203125, -6.815673828125, -6.04052734375, -5.265380859375, -4.490234375, -3.715087890625, -2.93994140625, -2.164794921875, -1.3896484375, -0.614501953125, 0.16064453125, 0.935791015625, 1.7109375, 2.486083984375, 3.26123046875, 4.036376953125, 4.8115234375, 5.586669921875, 6.36181640625, 7.136962890625, 7.912109375, 8.687255859375, 9.46240234375, 10.237548828125, 11.0126953125, 11.787841796875, 12.56298828125, 13.338134765625, 14.11328125, 14.888427734375, 15.66357421875, 16.438720703125, 17.2138671875, 17.989013671875, 18.76416015625, 19.539306640625, 20.314453125, 21.089599609375, 21.86474609375, 22.639892578125, 23.4150390625, 24.190185546875, 24.96533203125, 25.740478515625, 26.515625]}, "gradients/decoder.model.decoder.layers.7.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 5.0, 12.0, 13.0, 7.0, 11.0, 29.0, 31.0, 28.0, 51.0, 37.0, 63.0, 49.0, 74.0, 80.0, 81.0, 76.0, 75.0, 68.0, 46.0, 43.0, 33.0, 31.0, 26.0, 10.0, 12.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.96875, -38.9892578125, -38.009765625, -37.0302734375, -36.05078125, -35.0712890625, -34.091796875, -33.1123046875, -32.1328125, -31.1533203125, -30.173828125, -29.1943359375, -28.21484375, -27.2353515625, -26.255859375, -25.2763671875, -24.296875, -23.3173828125, -22.337890625, -21.3583984375, -20.37890625, -19.3994140625, -18.419921875, -17.4404296875, -16.4609375, -15.4814453125, -14.501953125, -13.5224609375, -12.54296875, -11.5634765625, -10.583984375, -9.6044921875, -8.625, -7.6455078125, -6.666015625, -5.6865234375, -4.70703125, -3.7275390625, -2.748046875, -1.7685546875, -0.7890625, 0.1904296875, 1.169921875, 2.1494140625, 3.12890625, 4.1083984375, 5.087890625, 6.0673828125, 7.046875, 8.0263671875, 9.005859375, 9.9853515625, 10.96484375, 11.9443359375, 12.923828125, 13.9033203125, 14.8828125, 15.8623046875, 16.841796875, 17.8212890625, 18.80078125, 19.7802734375, 20.759765625, 21.7392578125, 22.71875]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 7.0, 14.0, 7.0, 12.0, 19.0, 32.0, 35.0, 59.0, 56.0, 84.0, 96.0, 124.0, 150.0, 210.0, 257.0, 460.0, 2136.0, 37750.0, 731741.0, 264252.0, 8892.0, 816.0, 310.0, 226.0, 186.0, 127.0, 105.0, 92.0, 67.0, 56.0, 45.0, 41.0, 32.0, 18.0, 14.0, 12.0, 5.0, 3.0, 5.0, 3.0, 2.0, 1.0, 2.0, 1.0], "bins": [-40.34375, -39.303466796875, -38.26318359375, -37.222900390625, -36.1826171875, -35.142333984375, -34.10205078125, -33.061767578125, -32.021484375, -30.981201171875, -29.94091796875, -28.900634765625, -27.8603515625, -26.820068359375, -25.77978515625, -24.739501953125, -23.69921875, -22.658935546875, -21.61865234375, -20.578369140625, -19.5380859375, -18.497802734375, -17.45751953125, -16.417236328125, -15.376953125, -14.336669921875, -13.29638671875, -12.256103515625, -11.2158203125, -10.175537109375, -9.13525390625, -8.094970703125, -7.0546875, -6.014404296875, -4.97412109375, -3.933837890625, -2.8935546875, -1.853271484375, -0.81298828125, 0.227294921875, 1.267578125, 2.307861328125, 3.34814453125, 4.388427734375, 5.4287109375, 6.468994140625, 7.50927734375, 8.549560546875, 9.58984375, 10.630126953125, 11.67041015625, 12.710693359375, 13.7509765625, 14.791259765625, 15.83154296875, 16.871826171875, 17.912109375, 18.952392578125, 19.99267578125, 21.032958984375, 22.0732421875, 23.113525390625, 24.15380859375, 25.194091796875, 26.234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 5.0, 7.0, 11.0, 7.0, 7.0, 14.0, 17.0, 15.0, 20.0, 18.0, 24.0, 38.0, 41.0, 34.0, 43.0, 40.0, 44.0, 41.0, 49.0, 33.0, 37.0, 37.0, 50.0, 41.0, 37.0, 44.0, 37.0, 37.0, 25.0, 29.0, 24.0, 15.0, 8.0, 12.0, 12.0, 8.0, 15.0, 12.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.421875, -20.775634765625, -20.12939453125, -19.483154296875, -18.8369140625, -18.190673828125, -17.54443359375, -16.898193359375, -16.251953125, -15.605712890625, -14.95947265625, -14.313232421875, -13.6669921875, -13.020751953125, -12.37451171875, -11.728271484375, -11.08203125, -10.435791015625, -9.78955078125, -9.143310546875, -8.4970703125, -7.850830078125, -7.20458984375, -6.558349609375, -5.912109375, -5.265869140625, -4.61962890625, -3.973388671875, -3.3271484375, -2.680908203125, -2.03466796875, -1.388427734375, -0.7421875, -0.095947265625, 0.55029296875, 1.196533203125, 1.8427734375, 2.489013671875, 3.13525390625, 3.781494140625, 4.427734375, 5.073974609375, 5.72021484375, 6.366455078125, 7.0126953125, 7.658935546875, 8.30517578125, 8.951416015625, 9.59765625, 10.243896484375, 10.89013671875, 11.536376953125, 12.1826171875, 12.828857421875, 13.47509765625, 14.121337890625, 14.767578125, 15.413818359375, 16.06005859375, 16.706298828125, 17.3525390625, 17.998779296875, 18.64501953125, 19.291259765625, 19.9375]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 5.0, 7.0, 6.0, 6.0, 3.0, 12.0, 15.0, 25.0, 59.0, 69.0, 150.0, 409.0, 1421.0, 6400.0, 64483.0, 863614.0, 101680.0, 7579.0, 1746.0, 483.0, 163.0, 78.0, 45.0, 19.0, 14.0, 11.0, 9.0, 6.0, 5.0, 5.0, 4.0, 6.0, 5.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.4765625, -12.0933837890625, -11.710205078125, -11.3270263671875, -10.94384765625, -10.5606689453125, -10.177490234375, -9.7943115234375, -9.4111328125, -9.0279541015625, -8.644775390625, -8.2615966796875, -7.87841796875, -7.4952392578125, -7.112060546875, -6.7288818359375, -6.345703125, -5.9625244140625, -5.579345703125, -5.1961669921875, -4.81298828125, -4.4298095703125, -4.046630859375, -3.6634521484375, -3.2802734375, -2.8970947265625, -2.513916015625, -2.1307373046875, -1.74755859375, -1.3643798828125, -0.981201171875, -0.5980224609375, -0.21484375, 0.1683349609375, 0.551513671875, 0.9346923828125, 1.31787109375, 1.7010498046875, 2.084228515625, 2.4674072265625, 2.8505859375, 3.2337646484375, 3.616943359375, 4.0001220703125, 4.38330078125, 4.7664794921875, 5.149658203125, 5.5328369140625, 5.916015625, 6.2991943359375, 6.682373046875, 7.0655517578125, 7.44873046875, 7.8319091796875, 8.215087890625, 8.5982666015625, 8.9814453125, 9.3646240234375, 9.747802734375, 10.1309814453125, 10.51416015625, 10.8973388671875, 11.280517578125, 11.6636962890625, 12.046875]}, "gradients/decoder.model.decoder.layers.7.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 4.0, 10.0, 17.0, 12.0, 20.0, 32.0, 52.0, 44.0, 73.0, 80.0, 118.0, 112.0, 98.0, 89.0, 62.0, 50.0, 40.0, 25.0, 19.0, 11.0, 7.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007719993591308594, -0.0007390156388282776, -0.0007060319185256958, -0.000673048198223114, -0.0006400644779205322, -0.0006070807576179504, -0.0005740970373153687, -0.0005411133170127869, -0.0005081295967102051, -0.0004751458764076233, -0.0004421621561050415, -0.0004091784358024597, -0.00037619471549987793, -0.00034321099519729614, -0.00031022727489471436, -0.00027724355459213257, -0.0002442598342895508, -0.000211276113986969, -0.0001782923936843872, -0.00014530867338180542, -0.00011232495307922363, -7.934123277664185e-05, -4.635751247406006e-05, -1.3373792171478271e-05, 1.9609928131103516e-05, 5.25936484336853e-05, 8.557736873626709e-05, 0.00011856108903884888, 0.00015154480934143066, 0.00018452852964401245, 0.00021751224994659424, 0.000250495970249176, 0.0002834796905517578, 0.0003164634108543396, 0.0003494471311569214, 0.0003824308514595032, 0.00041541457176208496, 0.00044839829206466675, 0.00048138201236724854, 0.0005143657326698303, 0.0005473494529724121, 0.0005803331732749939, 0.0006133168935775757, 0.0006463006138801575, 0.0006792843341827393, 0.000712268054485321, 0.0007452517747879028, 0.0007782354950904846, 0.0008112192153930664, 0.0008442029356956482, 0.00087718665599823, 0.0009101703763008118, 0.0009431540966033936, 0.0009761378169059753, 0.0010091215372085571, 0.001042105257511139, 0.0010750889778137207, 0.0011080726981163025, 0.0011410564184188843, 0.001174040138721466, 0.0012070238590240479, 0.0012400075793266296, 0.0012729912996292114, 0.0013059750199317932, 0.001338958740234375]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 2.0, 5.0, 5.0, 11.0, 13.0, 23.0, 26.0, 36.0, 67.0, 93.0, 190.0, 587.0, 2478.0, 19678.0, 611911.0, 397853.0, 12831.0, 1816.0, 456.0, 181.0, 79.0, 58.0, 48.0, 25.0, 20.0, 11.0, 7.0, 8.0, 4.0, 1.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.3125, -11.914306640625, -11.51611328125, -11.117919921875, -10.7197265625, -10.321533203125, -9.92333984375, -9.525146484375, -9.126953125, -8.728759765625, -8.33056640625, -7.932373046875, -7.5341796875, -7.135986328125, -6.73779296875, -6.339599609375, -5.94140625, -5.543212890625, -5.14501953125, -4.746826171875, -4.3486328125, -3.950439453125, -3.55224609375, -3.154052734375, -2.755859375, -2.357666015625, -1.95947265625, -1.561279296875, -1.1630859375, -0.764892578125, -0.36669921875, 0.031494140625, 0.4296875, 0.827880859375, 1.22607421875, 1.624267578125, 2.0224609375, 2.420654296875, 2.81884765625, 3.217041015625, 3.615234375, 4.013427734375, 4.41162109375, 4.809814453125, 5.2080078125, 5.606201171875, 6.00439453125, 6.402587890625, 6.80078125, 7.198974609375, 7.59716796875, 7.995361328125, 8.3935546875, 8.791748046875, 9.18994140625, 9.588134765625, 9.986328125, 10.384521484375, 10.78271484375, 11.180908203125, 11.5791015625, 11.977294921875, 12.37548828125, 12.773681640625, 13.171875]}, "gradients/decoder.model.decoder.layers.7.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 7.0, 6.0, 8.0, 14.0, 22.0, 22.0, 21.0, 47.0, 51.0, 66.0, 60.0, 81.0, 95.0, 101.0, 81.0, 66.0, 51.0, 48.0, 37.0, 30.0, 26.0, 9.0, 15.0, 2.0, 2.0, 5.0, 7.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.736328125, -2.655487060546875, -2.57464599609375, -2.493804931640625, -2.4129638671875, -2.332122802734375, -2.25128173828125, -2.170440673828125, -2.089599609375, -2.008758544921875, -1.92791748046875, -1.847076416015625, -1.7662353515625, -1.685394287109375, -1.60455322265625, -1.523712158203125, -1.44287109375, -1.362030029296875, -1.28118896484375, -1.200347900390625, -1.1195068359375, -1.038665771484375, -0.95782470703125, -0.876983642578125, -0.796142578125, -0.715301513671875, -0.63446044921875, -0.553619384765625, -0.4727783203125, -0.391937255859375, -0.31109619140625, -0.230255126953125, -0.1494140625, -0.068572998046875, 0.01226806640625, 0.093109130859375, 0.1739501953125, 0.254791259765625, 0.33563232421875, 0.416473388671875, 0.497314453125, 0.578155517578125, 0.65899658203125, 0.739837646484375, 0.8206787109375, 0.901519775390625, 0.98236083984375, 1.063201904296875, 1.14404296875, 1.224884033203125, 1.30572509765625, 1.386566162109375, 1.4674072265625, 1.548248291015625, 1.62908935546875, 1.709930419921875, 1.790771484375, 1.871612548828125, 1.95245361328125, 2.033294677734375, 2.1141357421875, 2.194976806640625, 2.27581787109375, 2.356658935546875, 2.4375]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 17.0, 30.0, 73.0, 108.0, 182.0, 186.0, 174.0, 130.0, 52.0, 29.0, 8.0, 7.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.426513671875, -70.48649597167969, -68.54647064208984, -66.60645294189453, -64.66643524169922, -62.72641372680664, -60.78639602661133, -58.84637451171875, -56.90635681152344, -54.96633529663086, -53.02631759643555, -51.08629608154297, -49.146278381347656, -47.20625686645508, -45.266239166259766, -43.32621765136719, -41.386199951171875, -39.4461784362793, -37.506160736083984, -35.566139221191406, -33.626121520996094, -31.686100006103516, -29.746082305908203, -27.806060791015625, -25.866039276123047, -23.9260196685791, -21.986000061035156, -20.04598045349121, -18.105960845947266, -16.165939331054688, -14.225920677185059, -12.285901069641113, -10.345882415771484, -8.405862808227539, -6.465843200683594, -4.52582311630249, -2.585803508758545, -0.6457834243774414, 1.294236183166504, 3.234255790710449, 5.1742753982543945, 7.11429500579834, 9.054314613342285, 10.994335174560547, 12.934354782104492, 14.874374389648438, 16.814393997192383, 18.754413604736328, 20.694433212280273, 22.63445281982422, 24.574472427368164, 26.51449203491211, 28.454511642456055, 30.39453125, 32.33455276489258, 34.27457046508789, 36.21459197998047, 38.15461349487305, 40.09463119506836, 42.03465270996094, 43.97467041015625, 45.91469192504883, 47.85470962524414, 49.79473114013672, 51.73474884033203]}, "gradients/decoder.model.decoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 4.0, 3.0, 6.0, 7.0, 8.0, 11.0, 9.0, 14.0, 21.0, 17.0, 31.0, 23.0, 25.0, 30.0, 49.0, 34.0, 44.0, 34.0, 41.0, 48.0, 49.0, 45.0, 50.0, 50.0, 44.0, 44.0, 41.0, 26.0, 29.0, 26.0, 21.0, 24.0, 25.0, 11.0, 13.0, 13.0, 12.0, 6.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-41.74582290649414, -40.507667541503906, -39.269508361816406, -38.03135299682617, -36.79319381713867, -35.55503845214844, -34.31687927246094, -33.0787239074707, -31.840566635131836, -30.60240936279297, -29.3642520904541, -28.126094818115234, -26.887939453125, -25.6497802734375, -24.411624908447266, -23.1734676361084, -21.93531036376953, -20.697153091430664, -19.458995819091797, -18.22083854675293, -16.982681274414062, -15.744524955749512, -14.506368637084961, -13.268211364746094, -12.030054092407227, -10.79189682006836, -9.553739547729492, -8.315583229064941, -7.077425956726074, -5.839268684387207, -4.601111888885498, -3.362955093383789, -2.124797821044922, -0.8866407871246338, 0.3515162467956543, 1.5896732807159424, 2.8278303146362305, 4.065987586975098, 5.304144382476807, 6.542301177978516, 7.780458450317383, 9.01861572265625, 10.256772994995117, 11.494929313659668, 12.733086585998535, 13.971243858337402, 15.209400177001953, 16.44755744934082, 17.685714721679688, 18.923871994018555, 20.162029266357422, 21.40018653869629, 22.638343811035156, 23.87649917602539, 25.114656448364258, 26.352813720703125, 27.590970993041992, 28.82912826538086, 30.067285537719727, 31.305442810058594, 32.54359817504883, 33.78175735473633, 35.01991271972656, 36.25807189941406, 37.4962272644043]}, "gradients/decoder.model.decoder.layers.6.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 10.0, 13.0, 15.0, 26.0, 39.0, 54.0, 63.0, 94.0, 138.0, 212.0, 321.0, 535.0, 1170.0, 6264.0, 124165.0, 2439977.0, 1543421.0, 70928.0, 4776.0, 880.0, 405.0, 263.0, 163.0, 106.0, 81.0, 38.0, 30.0, 27.0, 11.0, 9.0, 11.0, 5.0, 10.0, 4.0, 4.0, 1.0, 3.0, 3.0, 2.0], "bins": [-42.09375, -41.064453125, -40.03515625, -39.005859375, -37.9765625, -36.947265625, -35.91796875, -34.888671875, -33.859375, -32.830078125, -31.80078125, -30.771484375, -29.7421875, -28.712890625, -27.68359375, -26.654296875, -25.625, -24.595703125, -23.56640625, -22.537109375, -21.5078125, -20.478515625, -19.44921875, -18.419921875, -17.390625, -16.361328125, -15.33203125, -14.302734375, -13.2734375, -12.244140625, -11.21484375, -10.185546875, -9.15625, -8.126953125, -7.09765625, -6.068359375, -5.0390625, -4.009765625, -2.98046875, -1.951171875, -0.921875, 0.107421875, 1.13671875, 2.166015625, 3.1953125, 4.224609375, 5.25390625, 6.283203125, 7.3125, 8.341796875, 9.37109375, 10.400390625, 11.4296875, 12.458984375, 13.48828125, 14.517578125, 15.546875, 16.576171875, 17.60546875, 18.634765625, 19.6640625, 20.693359375, 21.72265625, 22.751953125, 23.78125]}, "gradients/decoder.model.decoder.layers.6.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 2.0, 9.0, 13.0, 11.0, 14.0, 16.0, 11.0, 19.0, 37.0, 33.0, 39.0, 45.0, 49.0, 47.0, 68.0, 66.0, 55.0, 73.0, 52.0, 56.0, 59.0, 47.0, 41.0, 35.0, 25.0, 25.0, 17.0, 12.0, 8.0, 2.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-24.421875, -23.780517578125, -23.13916015625, -22.497802734375, -21.8564453125, -21.215087890625, -20.57373046875, -19.932373046875, -19.291015625, -18.649658203125, -18.00830078125, -17.366943359375, -16.7255859375, -16.084228515625, -15.44287109375, -14.801513671875, -14.16015625, -13.518798828125, -12.87744140625, -12.236083984375, -11.5947265625, -10.953369140625, -10.31201171875, -9.670654296875, -9.029296875, -8.387939453125, -7.74658203125, -7.105224609375, -6.4638671875, -5.822509765625, -5.18115234375, -4.539794921875, -3.8984375, -3.257080078125, -2.61572265625, -1.974365234375, -1.3330078125, -0.691650390625, -0.05029296875, 0.591064453125, 1.232421875, 1.873779296875, 2.51513671875, 3.156494140625, 3.7978515625, 4.439208984375, 5.08056640625, 5.721923828125, 6.36328125, 7.004638671875, 7.64599609375, 8.287353515625, 8.9287109375, 9.570068359375, 10.21142578125, 10.852783203125, 11.494140625, 12.135498046875, 12.77685546875, 13.418212890625, 14.0595703125, 14.700927734375, 15.34228515625, 15.983642578125, 16.625]}, "gradients/decoder.model.decoder.layers.6.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 10.0, 10.0, 16.0, 22.0, 41.0, 72.0, 110.0, 247.0, 534.0, 1552.0, 8289.0, 352666.0, 3739880.0, 84524.0, 4387.0, 1064.0, 418.0, 202.0, 109.0, 53.0, 26.0, 14.0, 16.0, 17.0, 7.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-55.0625, -53.87451171875, -52.6865234375, -51.49853515625, -50.310546875, -49.12255859375, -47.9345703125, -46.74658203125, -45.55859375, -44.37060546875, -43.1826171875, -41.99462890625, -40.806640625, -39.61865234375, -38.4306640625, -37.24267578125, -36.0546875, -34.86669921875, -33.6787109375, -32.49072265625, -31.302734375, -30.11474609375, -28.9267578125, -27.73876953125, -26.55078125, -25.36279296875, -24.1748046875, -22.98681640625, -21.798828125, -20.61083984375, -19.4228515625, -18.23486328125, -17.046875, -15.85888671875, -14.6708984375, -13.48291015625, -12.294921875, -11.10693359375, -9.9189453125, -8.73095703125, -7.54296875, -6.35498046875, -5.1669921875, -3.97900390625, -2.791015625, -1.60302734375, -0.4150390625, 0.77294921875, 1.9609375, 3.14892578125, 4.3369140625, 5.52490234375, 6.712890625, 7.90087890625, 9.0888671875, 10.27685546875, 11.46484375, 12.65283203125, 13.8408203125, 15.02880859375, 16.216796875, 17.40478515625, 18.5927734375, 19.78076171875, 20.96875]}, "gradients/decoder.model.decoder.layers.6.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 7.0, 10.0, 16.0, 23.0, 34.0, 51.0, 51.0, 97.0, 146.0, 262.0, 361.0, 475.0, 529.0, 549.0, 454.0, 359.0, 218.0, 144.0, 95.0, 54.0, 42.0, 27.0, 22.0, 18.0, 14.0, 9.0, 2.0, 0.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84375, -4.6409912109375, -4.438232421875, -4.2354736328125, -4.03271484375, -3.8299560546875, -3.627197265625, -3.4244384765625, -3.2216796875, -3.0189208984375, -2.816162109375, -2.6134033203125, -2.41064453125, -2.2078857421875, -2.005126953125, -1.8023681640625, -1.599609375, -1.3968505859375, -1.194091796875, -0.9913330078125, -0.78857421875, -0.5858154296875, -0.383056640625, -0.1802978515625, 0.0224609375, 0.2252197265625, 0.427978515625, 0.6307373046875, 0.83349609375, 1.0362548828125, 1.239013671875, 1.4417724609375, 1.64453125, 1.8472900390625, 2.050048828125, 2.2528076171875, 2.45556640625, 2.6583251953125, 2.861083984375, 3.0638427734375, 3.2666015625, 3.4693603515625, 3.672119140625, 3.8748779296875, 4.07763671875, 4.2803955078125, 4.483154296875, 4.6859130859375, 4.888671875, 5.0914306640625, 5.294189453125, 5.4969482421875, 5.69970703125, 5.9024658203125, 6.105224609375, 6.3079833984375, 6.5107421875, 6.7135009765625, 6.916259765625, 7.1190185546875, 7.32177734375, 7.5245361328125, 7.727294921875, 7.9300537109375, 8.1328125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 17.0, 25.0, 33.0, 46.0, 75.0, 72.0, 99.0, 106.0, 117.0, 95.0, 83.0, 64.0, 59.0, 30.0, 26.0, 16.0, 15.0, 9.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-38.80586624145508, -37.96184158325195, -37.11781692504883, -36.27379608154297, -35.429771423339844, -34.58574676513672, -33.741722106933594, -32.897701263427734, -32.05367660522461, -31.209651947021484, -30.365629196166992, -29.521604537963867, -28.677581787109375, -27.83355712890625, -26.989534378051758, -26.145509719848633, -25.30148696899414, -24.457462310791016, -23.613439559936523, -22.7694149017334, -21.925392150878906, -21.08136749267578, -20.23734474182129, -19.393320083618164, -18.54929542541504, -17.705270767211914, -16.861248016357422, -16.017223358154297, -15.173200607299805, -14.32917594909668, -13.485153198242188, -12.641128540039062, -11.797104835510254, -10.953081130981445, -10.109057426452637, -9.265033721923828, -8.42101001739502, -7.576985836029053, -6.732962131500244, -5.8889384269714355, -5.044914722442627, -4.200891017913818, -3.3568673133850098, -2.512843370437622, -1.6688196659088135, -0.8247957229614258, 0.019227981567382812, 0.8632516860961914, 1.707275390625, 2.5512990951538086, 3.395322799682617, 4.239346504211426, 5.083370208740234, 5.927394390106201, 6.77141809463501, 7.615441799163818, 8.459465026855469, 9.303488731384277, 10.147512435913086, 10.991536140441895, 11.835559844970703, 12.679584503173828, 13.52360725402832, 14.367631912231445, 15.211655616760254]}, "gradients/decoder.model.decoder.layers.6.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 4.0, 7.0, 6.0, 10.0, 3.0, 16.0, 13.0, 14.0, 24.0, 25.0, 23.0, 26.0, 25.0, 31.0, 38.0, 43.0, 39.0, 41.0, 60.0, 57.0, 58.0, 53.0, 49.0, 46.0, 31.0, 49.0, 34.0, 30.0, 26.0, 28.0, 20.0, 21.0, 9.0, 9.0, 9.0, 8.0, 10.0, 2.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-19.057518005371094, -18.486129760742188, -17.91474151611328, -17.343351364135742, -16.771963119506836, -16.20057487487793, -15.629186630249023, -15.0577974319458, -14.486408233642578, -13.915019989013672, -13.34363079071045, -12.772242546081543, -12.20085334777832, -11.629465103149414, -11.058076858520508, -10.486687660217285, -9.915299415588379, -9.343911170959473, -8.77252197265625, -8.201133728027344, -7.629744529724121, -7.058356285095215, -6.48696756362915, -5.915578842163086, -5.3441901206970215, -4.772801399230957, -4.201412677764893, -3.6300241947174072, -3.0586354732513428, -2.4872467517852783, -1.915858268737793, -1.3444695472717285, -0.7730808258056641, -0.20169216394424438, 0.3696964979171753, 0.9410851001739502, 1.5124738216400146, 2.083862543106079, 2.6552510261535645, 3.226639747619629, 3.7980284690856934, 4.369417190551758, 4.940805912017822, 5.512194633483887, 6.083582878112793, 6.654972076416016, 7.226360321044922, 7.797749042510986, 8.36913776397705, 8.940526008605957, 9.51191520690918, 10.083303451538086, 10.654692649841309, 11.226080894470215, 11.797470092773438, 12.368858337402344, 12.94024658203125, 13.511634826660156, 14.083024024963379, 14.654412269592285, 15.225801467895508, 15.797189712524414, 16.36857795715332, 16.93996810913086, 17.511356353759766]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 10.0, 8.0, 13.0, 12.0, 23.0, 34.0, 58.0, 74.0, 130.0, 215.0, 337.0, 686.0, 1524.0, 3316.0, 7935.0, 20821.0, 60668.0, 187838.0, 387183.0, 248648.0, 83140.0, 27713.0, 10188.0, 4148.0, 1825.0, 890.0, 397.0, 265.0, 154.0, 98.0, 67.0, 44.0, 26.0, 19.0, 13.0, 12.0, 7.0, 2.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.525390625, -3.423614501953125, -3.32183837890625, -3.220062255859375, -3.1182861328125, -3.016510009765625, -2.91473388671875, -2.812957763671875, -2.711181640625, -2.609405517578125, -2.50762939453125, -2.405853271484375, -2.3040771484375, -2.202301025390625, -2.10052490234375, -1.998748779296875, -1.89697265625, -1.795196533203125, -1.69342041015625, -1.591644287109375, -1.4898681640625, -1.388092041015625, -1.28631591796875, -1.184539794921875, -1.082763671875, -0.980987548828125, -0.87921142578125, -0.777435302734375, -0.6756591796875, -0.573883056640625, -0.47210693359375, -0.370330810546875, -0.2685546875, -0.166778564453125, -0.06500244140625, 0.036773681640625, 0.1385498046875, 0.240325927734375, 0.34210205078125, 0.443878173828125, 0.545654296875, 0.647430419921875, 0.74920654296875, 0.850982666015625, 0.9527587890625, 1.054534912109375, 1.15631103515625, 1.258087158203125, 1.35986328125, 1.461639404296875, 1.56341552734375, 1.665191650390625, 1.7669677734375, 1.868743896484375, 1.97052001953125, 2.072296142578125, 2.174072265625, 2.275848388671875, 2.37762451171875, 2.479400634765625, 2.5811767578125, 2.682952880859375, 2.78472900390625, 2.886505126953125, 2.98828125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 10.0, 5.0, 9.0, 22.0, 24.0, 28.0, 36.0, 30.0, 36.0, 49.0, 50.0, 74.0, 81.0, 78.0, 67.0, 71.0, 71.0, 49.0, 42.0, 37.0, 30.0, 28.0, 30.0, 13.0, 11.0, 10.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.546875, -14.981689453125, -14.41650390625, -13.851318359375, -13.2861328125, -12.720947265625, -12.15576171875, -11.590576171875, -11.025390625, -10.460205078125, -9.89501953125, -9.329833984375, -8.7646484375, -8.199462890625, -7.63427734375, -7.069091796875, -6.50390625, -5.938720703125, -5.37353515625, -4.808349609375, -4.2431640625, -3.677978515625, -3.11279296875, -2.547607421875, -1.982421875, -1.417236328125, -0.85205078125, -0.286865234375, 0.2783203125, 0.843505859375, 1.40869140625, 1.973876953125, 2.5390625, 3.104248046875, 3.66943359375, 4.234619140625, 4.7998046875, 5.364990234375, 5.93017578125, 6.495361328125, 7.060546875, 7.625732421875, 8.19091796875, 8.756103515625, 9.3212890625, 9.886474609375, 10.45166015625, 11.016845703125, 11.58203125, 12.147216796875, 12.71240234375, 13.277587890625, 13.8427734375, 14.407958984375, 14.97314453125, 15.538330078125, 16.103515625, 16.668701171875, 17.23388671875, 17.799072265625, 18.3642578125, 18.929443359375, 19.49462890625, 20.059814453125, 20.625]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 8.0, 6.0, 12.0, 17.0, 19.0, 43.0, 75.0, 105.0, 229.0, 491.0, 945.0, 1873.0, 4099.0, 9310.0, 21571.0, 52818.0, 126814.0, 253085.0, 287240.0, 166349.0, 71585.0, 29050.0, 12299.0, 5428.0, 2553.0, 1209.0, 579.0, 310.0, 168.0, 103.0, 64.0, 34.0, 21.0, 14.0, 18.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6787109375, -1.6092376708984375, -1.539764404296875, -1.4702911376953125, -1.40081787109375, -1.3313446044921875, -1.261871337890625, -1.1923980712890625, -1.1229248046875, -1.0534515380859375, -0.983978271484375, -0.9145050048828125, -0.84503173828125, -0.7755584716796875, -0.706085205078125, -0.6366119384765625, -0.567138671875, -0.4976654052734375, -0.428192138671875, -0.3587188720703125, -0.28924560546875, -0.2197723388671875, -0.150299072265625, -0.0808258056640625, -0.0113525390625, 0.0581207275390625, 0.127593994140625, 0.1970672607421875, 0.26654052734375, 0.3360137939453125, 0.405487060546875, 0.4749603271484375, 0.54443359375, 0.6139068603515625, 0.683380126953125, 0.7528533935546875, 0.82232666015625, 0.8917999267578125, 0.961273193359375, 1.0307464599609375, 1.1002197265625, 1.1696929931640625, 1.239166259765625, 1.3086395263671875, 1.37811279296875, 1.4475860595703125, 1.517059326171875, 1.5865325927734375, 1.656005859375, 1.7254791259765625, 1.794952392578125, 1.8644256591796875, 1.93389892578125, 2.0033721923828125, 2.072845458984375, 2.1423187255859375, 2.2117919921875, 2.2812652587890625, 2.350738525390625, 2.4202117919921875, 2.48968505859375, 2.5591583251953125, 2.628631591796875, 2.6981048583984375, 2.767578125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 8.0, 9.0, 6.0, 4.0, 20.0, 19.0, 14.0, 23.0, 25.0, 29.0, 33.0, 42.0, 53.0, 61.0, 61.0, 49.0, 63.0, 69.0, 63.0, 57.0, 46.0, 44.0, 26.0, 35.0, 27.0, 27.0, 17.0, 16.0, 15.0, 16.0, 8.0, 8.0, 3.0, 7.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.96875, -22.9765625, -21.984375, -20.9921875, -20.0, -19.0078125, -18.015625, -17.0234375, -16.03125, -15.0390625, -14.046875, -13.0546875, -12.0625, -11.0703125, -10.078125, -9.0859375, -8.09375, -7.1015625, -6.109375, -5.1171875, -4.125, -3.1328125, -2.140625, -1.1484375, -0.15625, 0.8359375, 1.828125, 2.8203125, 3.8125, 4.8046875, 5.796875, 6.7890625, 7.78125, 8.7734375, 9.765625, 10.7578125, 11.75, 12.7421875, 13.734375, 14.7265625, 15.71875, 16.7109375, 17.703125, 18.6953125, 19.6875, 20.6796875, 21.671875, 22.6640625, 23.65625, 24.6484375, 25.640625, 26.6328125, 27.625, 28.6171875, 29.609375, 30.6015625, 31.59375, 32.5859375, 33.578125, 34.5703125, 35.5625, 36.5546875, 37.546875, 38.5390625, 39.53125]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 5.0, 8.0, 7.0, 14.0, 15.0, 20.0, 35.0, 34.0, 69.0, 80.0, 141.0, 208.0, 357.0, 543.0, 1017.0, 1952.0, 4506.0, 12625.0, 49940.0, 265583.0, 537393.0, 132063.0, 27184.0, 7941.0, 3134.0, 1470.0, 815.0, 502.0, 279.0, 184.0, 138.0, 101.0, 61.0, 45.0, 21.0, 22.0, 8.0, 9.0, 12.0, 7.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5302734375, -0.5133285522460938, -0.4963836669921875, -0.47943878173828125, -0.462493896484375, -0.44554901123046875, -0.4286041259765625, -0.41165924072265625, -0.39471435546875, -0.37776947021484375, -0.3608245849609375, -0.34387969970703125, -0.326934814453125, -0.30998992919921875, -0.2930450439453125, -0.27610015869140625, -0.2591552734375, -0.24221038818359375, -0.2252655029296875, -0.20832061767578125, -0.191375732421875, -0.17443084716796875, -0.1574859619140625, -0.14054107666015625, -0.12359619140625, -0.10665130615234375, -0.0897064208984375, -0.07276153564453125, -0.055816650390625, -0.03887176513671875, -0.0219268798828125, -0.00498199462890625, 0.011962890625, 0.02890777587890625, 0.0458526611328125, 0.06279754638671875, 0.079742431640625, 0.09668731689453125, 0.1136322021484375, 0.13057708740234375, 0.14752197265625, 0.16446685791015625, 0.1814117431640625, 0.19835662841796875, 0.215301513671875, 0.23224639892578125, 0.2491912841796875, 0.26613616943359375, 0.2830810546875, 0.30002593994140625, 0.3169708251953125, 0.33391571044921875, 0.350860595703125, 0.36780548095703125, 0.3847503662109375, 0.40169525146484375, 0.41864013671875, 0.43558502197265625, 0.4525299072265625, 0.46947479248046875, 0.486419677734375, 0.5033645629882812, 0.5203094482421875, 0.5372543334960938, 0.55419921875]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 7.0, 4.0, 11.0, 22.0, 28.0, 34.0, 40.0, 51.0, 73.0, 99.0, 85.0, 110.0, 108.0, 95.0, 57.0, 47.0, 34.0, 43.0, 18.0, 12.0, 7.0, 9.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0004019737243652344, -0.00039266422390937805, -0.00038335472345352173, -0.0003740452229976654, -0.0003647357225418091, -0.00035542622208595276, -0.00034611672163009644, -0.0003368072211742401, -0.0003274977207183838, -0.00031818822026252747, -0.00030887871980667114, -0.0002995692193508148, -0.0002902597188949585, -0.00028095021843910217, -0.00027164071798324585, -0.0002623312175273895, -0.0002530217170715332, -0.00024371221661567688, -0.00023440271615982056, -0.00022509321570396423, -0.0002157837152481079, -0.0002064742147922516, -0.00019716471433639526, -0.00018785521388053894, -0.00017854571342468262, -0.0001692362129688263, -0.00015992671251296997, -0.00015061721205711365, -0.00014130771160125732, -0.000131998211145401, -0.00012268871068954468, -0.00011337921023368835, -0.00010406970977783203, -9.476020932197571e-05, -8.545070886611938e-05, -7.614120841026306e-05, -6.683170795440674e-05, -5.7522207498550415e-05, -4.821270704269409e-05, -3.890320658683777e-05, -2.9593706130981445e-05, -2.0284205675125122e-05, -1.0974705219268799e-05, -1.6652047634124756e-06, 7.644295692443848e-06, 1.695379614830017e-05, 2.6263296604156494e-05, 3.557279706001282e-05, 4.488229751586914e-05, 5.4191797971725464e-05, 6.350129842758179e-05, 7.281079888343811e-05, 8.212029933929443e-05, 9.142979979515076e-05, 0.00010073930025100708, 0.0001100488007068634, 0.00011935830116271973, 0.00012866780161857605, 0.00013797730207443237, 0.0001472868025302887, 0.00015659630298614502, 0.00016590580344200134, 0.00017521530389785767, 0.000184524804353714, 0.0001938343048095703]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 7.0, 7.0, 21.0, 12.0, 13.0, 27.0, 31.0, 49.0, 88.0, 116.0, 196.0, 438.0, 1074.0, 3044.0, 10354.0, 40955.0, 196089.0, 555193.0, 187090.0, 39141.0, 9663.0, 2903.0, 1029.0, 401.0, 219.0, 129.0, 70.0, 58.0, 31.0, 29.0, 19.0, 16.0, 7.0, 11.0, 7.0, 9.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4990234375, -0.4836616516113281, -0.46829986572265625, -0.4529380798339844, -0.4375762939453125, -0.4222145080566406, -0.40685272216796875, -0.3914909362792969, -0.376129150390625, -0.3607673645019531, -0.34540557861328125, -0.3300437927246094, -0.3146820068359375, -0.2993202209472656, -0.28395843505859375, -0.2685966491699219, -0.25323486328125, -0.23787307739257812, -0.22251129150390625, -0.20714950561523438, -0.1917877197265625, -0.17642593383789062, -0.16106414794921875, -0.14570236206054688, -0.130340576171875, -0.11497879028320312, -0.09961700439453125, -0.08425521850585938, -0.0688934326171875, -0.053531646728515625, -0.03816986083984375, -0.022808074951171875, -0.0074462890625, 0.007915496826171875, 0.02327728271484375, 0.038639068603515625, 0.0540008544921875, 0.06936264038085938, 0.08472442626953125, 0.10008621215820312, 0.115447998046875, 0.13080978393554688, 0.14617156982421875, 0.16153335571289062, 0.1768951416015625, 0.19225692749023438, 0.20761871337890625, 0.22298049926757812, 0.23834228515625, 0.2537040710449219, 0.26906585693359375, 0.2844276428222656, 0.2997894287109375, 0.3151512145996094, 0.33051300048828125, 0.3458747863769531, 0.361236572265625, 0.3765983581542969, 0.39196014404296875, 0.4073219299316406, 0.4226837158203125, 0.4380455017089844, 0.45340728759765625, 0.4687690734863281, 0.484130859375]}, "gradients/decoder.model.decoder.layers.6.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 4.0, 6.0, 6.0, 10.0, 14.0, 12.0, 14.0, 11.0, 14.0, 26.0, 43.0, 45.0, 66.0, 82.0, 76.0, 106.0, 89.0, 93.0, 58.0, 43.0, 33.0, 36.0, 37.0, 25.0, 9.0, 10.0, 7.0, 9.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.151123046875, -0.1458301544189453, -0.14053726196289062, -0.13524436950683594, -0.12995147705078125, -0.12465858459472656, -0.11936569213867188, -0.11407279968261719, -0.1087799072265625, -0.10348701477050781, -0.09819412231445312, -0.09290122985839844, -0.08760833740234375, -0.08231544494628906, -0.07702255249023438, -0.07172966003417969, -0.066436767578125, -0.06114387512207031, -0.055850982666015625, -0.05055809020996094, -0.04526519775390625, -0.03997230529785156, -0.034679412841796875, -0.029386520385742188, -0.0240936279296875, -0.018800735473632812, -0.013507843017578125, -0.008214950561523438, -0.00292205810546875, 0.0023708343505859375, 0.007663726806640625, 0.012956619262695312, 0.01824951171875, 0.023542404174804688, 0.028835296630859375, 0.03412818908691406, 0.03942108154296875, 0.04471397399902344, 0.050006866455078125, 0.05529975891113281, 0.0605926513671875, 0.06588554382324219, 0.07117843627929688, 0.07647132873535156, 0.08176422119140625, 0.08705711364746094, 0.09235000610351562, 0.09764289855957031, 0.102935791015625, 0.10822868347167969, 0.11352157592773438, 0.11881446838378906, 0.12410736083984375, 0.12940025329589844, 0.13469314575195312, 0.1399860382080078, 0.1452789306640625, 0.1505718231201172, 0.15586471557617188, 0.16115760803222656, 0.16645050048828125, 0.17174339294433594, 0.17703628540039062, 0.1823291778564453, 0.1876220703125]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 14.0, 46.0, 133.0, 295.0, 319.0, 145.0, 48.0, 8.0, 2.0, 3.0], "bins": [-94.42756652832031, -92.79834747314453, -91.16912841796875, -89.5399169921875, -87.91069793701172, -86.28147888183594, -84.65225982666016, -83.02304077148438, -81.3938217163086, -79.76460266113281, -78.13538360595703, -76.50616455078125, -74.876953125, -73.24773406982422, -71.61851501464844, -69.98929595947266, -68.36007690429688, -66.7308578491211, -65.10163879394531, -63.4724235534668, -61.843204498291016, -60.2139892578125, -58.58477020263672, -56.95555114746094, -55.32633972167969, -53.697120666503906, -52.06790542602539, -50.43868637084961, -48.80946731567383, -47.18025207519531, -45.55103302001953, -43.92181396484375, -42.29259490966797, -40.66337585449219, -39.03416061401367, -37.40494155883789, -35.77572250366211, -34.146507263183594, -32.51728820800781, -30.88806915283203, -29.25885009765625, -27.6296329498291, -26.00041389465332, -24.371196746826172, -22.74197769165039, -21.112760543823242, -19.483543395996094, -17.854324340820312, -16.225107192993164, -14.5958890914917, -12.966670989990234, -11.337453842163086, -9.708235740661621, -8.079017639160156, -6.449800491333008, -4.820582389831543, -3.191364288330078, -1.5621464252471924, 0.06707143783569336, 1.6962890625, 3.325507164001465, 4.95472526550293, 6.583942413330078, 8.213160514831543, 9.842378616333008]}, "gradients/decoder.model.decoder.layers.6.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 5.0, 6.0, 6.0, 7.0, 5.0, 14.0, 19.0, 18.0, 25.0, 29.0, 24.0, 26.0, 34.0, 38.0, 43.0, 47.0, 44.0, 69.0, 65.0, 69.0, 51.0, 48.0, 43.0, 53.0, 32.0, 26.0, 30.0, 28.0, 28.0, 13.0, 14.0, 7.0, 14.0, 7.0, 7.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.694572448730469, -13.271334648132324, -12.84809684753418, -12.424860000610352, -12.001622200012207, -11.578384399414062, -11.155147552490234, -10.73190975189209, -10.308671951293945, -9.8854341506958, -9.462196350097656, -9.038959503173828, -8.615721702575684, -8.192483901977539, -7.769246578216553, -7.346009254455566, -6.922771453857422, -6.499533653259277, -6.076296329498291, -5.653059005737305, -5.22982120513916, -4.806583404541016, -4.383346080780029, -3.960108518600464, -3.5368709564208984, -3.113633394241333, -2.6903958320617676, -2.267158269882202, -1.8439207077026367, -1.4206831455230713, -0.9974455833435059, -0.5742080211639404, -0.1509695053100586, 0.27226805686950684, 0.6955056190490723, 1.1187431812286377, 1.5419807434082031, 1.9652183055877686, 2.388455867767334, 2.8116934299468994, 3.234930992126465, 3.6581685543060303, 4.081406116485596, 4.504643440246582, 4.927881240844727, 5.351119041442871, 5.774356365203857, 6.197593688964844, 6.620831489562988, 7.044069290161133, 7.467306613922119, 7.8905439376831055, 8.31378173828125, 8.737019538879395, 9.160257339477539, 9.583494186401367, 10.006731986999512, 10.429969787597656, 10.853206634521484, 11.276444435119629, 11.699682235717773, 12.122920036315918, 12.546157836914062, 12.96939468383789, 13.392632484436035]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 2.0, 7.0, 5.0, 6.0, 10.0, 15.0, 12.0, 23.0, 30.0, 24.0, 38.0, 61.0, 137.0, 315.0, 1153.0, 7718.0, 109366.0, 707703.0, 205846.0, 13530.0, 1703.0, 414.0, 142.0, 78.0, 48.0, 40.0, 30.0, 26.0, 17.0, 16.0, 4.0, 11.0, 6.0, 2.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.71875, -18.917724609375, -18.11669921875, -17.315673828125, -16.5146484375, -15.713623046875, -14.91259765625, -14.111572265625, -13.310546875, -12.509521484375, -11.70849609375, -10.907470703125, -10.1064453125, -9.305419921875, -8.50439453125, -7.703369140625, -6.90234375, -6.101318359375, -5.30029296875, -4.499267578125, -3.6982421875, -2.897216796875, -2.09619140625, -1.295166015625, -0.494140625, 0.306884765625, 1.10791015625, 1.908935546875, 2.7099609375, 3.510986328125, 4.31201171875, 5.113037109375, 5.9140625, 6.715087890625, 7.51611328125, 8.317138671875, 9.1181640625, 9.919189453125, 10.72021484375, 11.521240234375, 12.322265625, 13.123291015625, 13.92431640625, 14.725341796875, 15.5263671875, 16.327392578125, 17.12841796875, 17.929443359375, 18.73046875, 19.531494140625, 20.33251953125, 21.133544921875, 21.9345703125, 22.735595703125, 23.53662109375, 24.337646484375, 25.138671875, 25.939697265625, 26.74072265625, 27.541748046875, 28.3427734375, 29.143798828125, 29.94482421875, 30.745849609375, 31.546875]}, "gradients/decoder.model.decoder.layers.6.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 5.0, 6.0, 7.0, 11.0, 18.0, 15.0, 15.0, 22.0, 22.0, 32.0, 28.0, 45.0, 43.0, 32.0, 50.0, 80.0, 62.0, 68.0, 58.0, 54.0, 51.0, 35.0, 47.0, 41.0, 26.0, 28.0, 17.0, 20.0, 22.0, 13.0, 14.0, 7.0, 5.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.703125, -29.870849609375, -29.03857421875, -28.206298828125, -27.3740234375, -26.541748046875, -25.70947265625, -24.877197265625, -24.044921875, -23.212646484375, -22.38037109375, -21.548095703125, -20.7158203125, -19.883544921875, -19.05126953125, -18.218994140625, -17.38671875, -16.554443359375, -15.72216796875, -14.889892578125, -14.0576171875, -13.225341796875, -12.39306640625, -11.560791015625, -10.728515625, -9.896240234375, -9.06396484375, -8.231689453125, -7.3994140625, -6.567138671875, -5.73486328125, -4.902587890625, -4.0703125, -3.238037109375, -2.40576171875, -1.573486328125, -0.7412109375, 0.091064453125, 0.92333984375, 1.755615234375, 2.587890625, 3.420166015625, 4.25244140625, 5.084716796875, 5.9169921875, 6.749267578125, 7.58154296875, 8.413818359375, 9.24609375, 10.078369140625, 10.91064453125, 11.742919921875, 12.5751953125, 13.407470703125, 14.23974609375, 15.072021484375, 15.904296875, 16.736572265625, 17.56884765625, 18.401123046875, 19.2333984375, 20.065673828125, 20.89794921875, 21.730224609375, 22.5625]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 7.0, 10.0, 17.0, 10.0, 19.0, 24.0, 25.0, 40.0, 59.0, 76.0, 114.0, 170.0, 251.0, 478.0, 1768.0, 24546.0, 754050.0, 258522.0, 6409.0, 875.0, 384.0, 191.0, 112.0, 107.0, 67.0, 47.0, 34.0, 33.0, 28.0, 18.0, 11.0, 16.0, 8.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 3.0], "bins": [-38.46875, -37.39404296875, -36.3193359375, -35.24462890625, -34.169921875, -33.09521484375, -32.0205078125, -30.94580078125, -29.87109375, -28.79638671875, -27.7216796875, -26.64697265625, -25.572265625, -24.49755859375, -23.4228515625, -22.34814453125, -21.2734375, -20.19873046875, -19.1240234375, -18.04931640625, -16.974609375, -15.89990234375, -14.8251953125, -13.75048828125, -12.67578125, -11.60107421875, -10.5263671875, -9.45166015625, -8.376953125, -7.30224609375, -6.2275390625, -5.15283203125, -4.078125, -3.00341796875, -1.9287109375, -0.85400390625, 0.220703125, 1.29541015625, 2.3701171875, 3.44482421875, 4.51953125, 5.59423828125, 6.6689453125, 7.74365234375, 8.818359375, 9.89306640625, 10.9677734375, 12.04248046875, 13.1171875, 14.19189453125, 15.2666015625, 16.34130859375, 17.416015625, 18.49072265625, 19.5654296875, 20.64013671875, 21.71484375, 22.78955078125, 23.8642578125, 24.93896484375, 26.013671875, 27.08837890625, 28.1630859375, 29.23779296875, 30.3125]}, "gradients/decoder.model.decoder.layers.6.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 3.0, 5.0, 4.0, 5.0, 13.0, 14.0, 14.0, 21.0, 14.0, 28.0, 26.0, 27.0, 35.0, 34.0, 31.0, 44.0, 46.0, 42.0, 53.0, 48.0, 57.0, 41.0, 47.0, 26.0, 35.0, 43.0, 40.0, 28.0, 36.0, 23.0, 26.0, 7.0, 16.0, 12.0, 14.0, 11.0, 7.0, 2.0, 4.0, 5.0, 7.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-29.375, -28.525634765625, -27.67626953125, -26.826904296875, -25.9775390625, -25.128173828125, -24.27880859375, -23.429443359375, -22.580078125, -21.730712890625, -20.88134765625, -20.031982421875, -19.1826171875, -18.333251953125, -17.48388671875, -16.634521484375, -15.78515625, -14.935791015625, -14.08642578125, -13.237060546875, -12.3876953125, -11.538330078125, -10.68896484375, -9.839599609375, -8.990234375, -8.140869140625, -7.29150390625, -6.442138671875, -5.5927734375, -4.743408203125, -3.89404296875, -3.044677734375, -2.1953125, -1.345947265625, -0.49658203125, 0.352783203125, 1.2021484375, 2.051513671875, 2.90087890625, 3.750244140625, 4.599609375, 5.448974609375, 6.29833984375, 7.147705078125, 7.9970703125, 8.846435546875, 9.69580078125, 10.545166015625, 11.39453125, 12.243896484375, 13.09326171875, 13.942626953125, 14.7919921875, 15.641357421875, 16.49072265625, 17.340087890625, 18.189453125, 19.038818359375, 19.88818359375, 20.737548828125, 21.5869140625, 22.436279296875, 23.28564453125, 24.135009765625, 24.984375]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 5.0, 2.0, 3.0, 4.0, 15.0, 14.0, 27.0, 40.0, 67.0, 159.0, 532.0, 2391.0, 14003.0, 778973.0, 242938.0, 7387.0, 1372.0, 352.0, 113.0, 71.0, 22.0, 22.0, 9.0, 10.0, 4.0, 4.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.59375, -14.050048828125, -13.50634765625, -12.962646484375, -12.4189453125, -11.875244140625, -11.33154296875, -10.787841796875, -10.244140625, -9.700439453125, -9.15673828125, -8.613037109375, -8.0693359375, -7.525634765625, -6.98193359375, -6.438232421875, -5.89453125, -5.350830078125, -4.80712890625, -4.263427734375, -3.7197265625, -3.176025390625, -2.63232421875, -2.088623046875, -1.544921875, -1.001220703125, -0.45751953125, 0.086181640625, 0.6298828125, 1.173583984375, 1.71728515625, 2.260986328125, 2.8046875, 3.348388671875, 3.89208984375, 4.435791015625, 4.9794921875, 5.523193359375, 6.06689453125, 6.610595703125, 7.154296875, 7.697998046875, 8.24169921875, 8.785400390625, 9.3291015625, 9.872802734375, 10.41650390625, 10.960205078125, 11.50390625, 12.047607421875, 12.59130859375, 13.135009765625, 13.6787109375, 14.222412109375, 14.76611328125, 15.309814453125, 15.853515625, 16.397216796875, 16.94091796875, 17.484619140625, 18.0283203125, 18.572021484375, 19.11572265625, 19.659423828125, 20.203125]}, "gradients/decoder.model.decoder.layers.6.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 7.0, 12.0, 30.0, 41.0, 74.0, 144.0, 208.0, 171.0, 117.0, 80.0, 50.0, 27.0, 11.0, 9.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00252532958984375, -0.0024619102478027344, -0.0023984909057617188, -0.002335071563720703, -0.0022716522216796875, -0.002208232879638672, -0.0021448135375976562, -0.0020813941955566406, -0.002017974853515625, -0.0019545555114746094, -0.0018911361694335938, -0.0018277168273925781, -0.0017642974853515625, -0.0017008781433105469, -0.0016374588012695312, -0.0015740394592285156, -0.0015106201171875, -0.0014472007751464844, -0.0013837814331054688, -0.0013203620910644531, -0.0012569427490234375, -0.0011935234069824219, -0.0011301040649414062, -0.0010666847229003906, -0.001003265380859375, -0.0009398460388183594, -0.0008764266967773438, -0.0008130073547363281, -0.0007495880126953125, -0.0006861686706542969, -0.0006227493286132812, -0.0005593299865722656, -0.00049591064453125, -0.0004324913024902344, -0.00036907196044921875, -0.0003056526184082031, -0.0002422332763671875, -0.00017881393432617188, -0.00011539459228515625, -5.1975250244140625e-05, 1.1444091796875e-05, 7.486343383789062e-05, 0.00013828277587890625, 0.00020170211791992188, 0.0002651214599609375, 0.0003285408020019531, 0.00039196014404296875, 0.0004553794860839844, 0.000518798828125, 0.0005822181701660156, 0.0006456375122070312, 0.0007090568542480469, 0.0007724761962890625, 0.0008358955383300781, 0.0008993148803710938, 0.0009627342224121094, 0.001026153564453125, 0.0010895729064941406, 0.0011529922485351562, 0.0012164115905761719, 0.0012798309326171875, 0.0013432502746582031, 0.0014066696166992188, 0.0014700889587402344, 0.00153350830078125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 6.0, 6.0, 8.0, 16.0, 37.0, 36.0, 56.0, 67.0, 156.0, 352.0, 1245.0, 7584.0, 330337.0, 692505.0, 13534.0, 1708.0, 442.0, 183.0, 109.0, 61.0, 38.0, 22.0, 11.0, 9.0, 8.0, 4.0, 4.0, 1.0, 2.0, 5.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.890625, -16.3804931640625, -15.870361328125, -15.3602294921875, -14.85009765625, -14.3399658203125, -13.829833984375, -13.3197021484375, -12.8095703125, -12.2994384765625, -11.789306640625, -11.2791748046875, -10.76904296875, -10.2589111328125, -9.748779296875, -9.2386474609375, -8.728515625, -8.2183837890625, -7.708251953125, -7.1981201171875, -6.68798828125, -6.1778564453125, -5.667724609375, -5.1575927734375, -4.6474609375, -4.1373291015625, -3.627197265625, -3.1170654296875, -2.60693359375, -2.0968017578125, -1.586669921875, -1.0765380859375, -0.56640625, -0.0562744140625, 0.453857421875, 0.9639892578125, 1.47412109375, 1.9842529296875, 2.494384765625, 3.0045166015625, 3.5146484375, 4.0247802734375, 4.534912109375, 5.0450439453125, 5.55517578125, 6.0653076171875, 6.575439453125, 7.0855712890625, 7.595703125, 8.1058349609375, 8.615966796875, 9.1260986328125, 9.63623046875, 10.1463623046875, 10.656494140625, 11.1666259765625, 11.6767578125, 12.1868896484375, 12.697021484375, 13.2071533203125, 13.71728515625, 14.2274169921875, 14.737548828125, 15.2476806640625, 15.7578125]}, "gradients/decoder.model.decoder.layers.6.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 6.0, 3.0, 5.0, 13.0, 23.0, 24.0, 35.0, 47.0, 51.0, 49.0, 78.0, 90.0, 79.0, 94.0, 89.0, 74.0, 55.0, 42.0, 38.0, 22.0, 18.0, 14.0, 15.0, 9.0, 9.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4765625, -2.387908935546875, -2.29925537109375, -2.210601806640625, -2.1219482421875, -2.033294677734375, -1.94464111328125, -1.855987548828125, -1.767333984375, -1.678680419921875, -1.59002685546875, -1.501373291015625, -1.4127197265625, -1.324066162109375, -1.23541259765625, -1.146759033203125, -1.05810546875, -0.969451904296875, -0.88079833984375, -0.792144775390625, -0.7034912109375, -0.614837646484375, -0.52618408203125, -0.437530517578125, -0.348876953125, -0.260223388671875, -0.17156982421875, -0.082916259765625, 0.0057373046875, 0.094390869140625, 0.18304443359375, 0.271697998046875, 0.3603515625, 0.449005126953125, 0.53765869140625, 0.626312255859375, 0.7149658203125, 0.803619384765625, 0.89227294921875, 0.980926513671875, 1.069580078125, 1.158233642578125, 1.24688720703125, 1.335540771484375, 1.4241943359375, 1.512847900390625, 1.60150146484375, 1.690155029296875, 1.77880859375, 1.867462158203125, 1.95611572265625, 2.044769287109375, 2.1334228515625, 2.222076416015625, 2.31072998046875, 2.399383544921875, 2.488037109375, 2.576690673828125, 2.66534423828125, 2.753997802734375, 2.8426513671875, 2.931304931640625, 3.01995849609375, 3.108612060546875, 3.197265625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 12.0, 30.0, 60.0, 116.0, 189.0, 215.0, 200.0, 95.0, 55.0, 16.0, 6.0, 8.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.32645416259766, -91.21869659423828, -89.1109390258789, -87.00318908691406, -84.89543151855469, -82.78767395019531, -80.67991638183594, -78.57215881347656, -76.46440124511719, -74.35664367675781, -72.24888610839844, -70.1411361694336, -68.03337860107422, -65.92562103271484, -63.81786346435547, -61.710105895996094, -59.60235595703125, -57.494598388671875, -55.386844635009766, -53.27908706665039, -51.17133331298828, -49.063575744628906, -46.95581817626953, -44.848060607910156, -42.74030685424805, -40.63254928588867, -38.52479553222656, -36.41703796386719, -34.30928039550781, -32.2015266418457, -30.093769073486328, -27.986013412475586, -25.878250122070312, -23.77049446105957, -21.662738800048828, -19.554981231689453, -17.44722557067871, -15.339469909667969, -13.23171329498291, -11.123956680297852, -9.01620101928711, -6.908444881439209, -4.800688743591309, -2.692932605743408, -0.5851764678955078, 1.5225791931152344, 3.630335807800293, 5.738092422485352, 7.845848083496094, 9.953603744506836, 12.061360359191895, 14.169116973876953, 16.276872634887695, 18.384628295898438, 20.492385864257812, 22.600141525268555, 24.707897186279297, 26.81565284729004, 28.92340850830078, 31.031166076660156, 33.13892364501953, 35.24667739868164, 37.354434967041016, 39.462188720703125, 41.5699462890625]}, "gradients/decoder.model.decoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 7.0, 4.0, 5.0, 6.0, 3.0, 7.0, 11.0, 10.0, 7.0, 21.0, 11.0, 29.0, 28.0, 27.0, 27.0, 37.0, 43.0, 39.0, 45.0, 22.0, 41.0, 39.0, 45.0, 39.0, 39.0, 42.0, 42.0, 40.0, 37.0, 32.0, 34.0, 24.0, 26.0, 20.0, 16.0, 16.0, 11.0, 17.0, 16.0, 7.0, 12.0, 6.0, 3.0, 4.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.62914276123047, -42.215328216552734, -40.801517486572266, -39.38770294189453, -37.9738883972168, -36.56007766723633, -35.146263122558594, -33.732452392578125, -32.31863784790039, -30.90482521057129, -29.491010665893555, -28.077198028564453, -26.66338539123535, -25.24957275390625, -23.835758209228516, -22.421945571899414, -21.00813102722168, -19.594318389892578, -18.180503845214844, -16.766691207885742, -15.35287857055664, -13.939064979553223, -12.525251388549805, -11.111438751220703, -9.697625160217285, -8.283811569213867, -6.869998931884766, -5.456185340881348, -4.042372226715088, -2.628559112548828, -1.2147455215454102, 0.1990671157836914, 1.6128807067871094, 3.026693820953369, 4.440506935119629, 5.854320526123047, 7.268133640289307, 8.681946754455566, 10.095760345458984, 11.509572982788086, 12.923386573791504, 14.337200164794922, 15.751012802124023, 17.164825439453125, 18.57863998413086, 19.99245262145996, 21.406265258789062, 22.820079803466797, 24.2338924407959, 25.647705078125, 27.061519622802734, 28.475332260131836, 29.889144897460938, 31.302959442138672, 32.716773986816406, 34.130584716796875, 35.54439926147461, 36.958213806152344, 38.37202453613281, 39.78583908081055, 41.19965362548828, 42.61346435546875, 44.027278900146484, 45.44109344482422, 46.85490417480469]}, "gradients/decoder.model.decoder.layers.5.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 3.0, 11.0, 15.0, 16.0, 29.0, 38.0, 39.0, 67.0, 106.0, 154.0, 226.0, 379.0, 699.0, 1921.0, 19301.0, 932771.0, 3117338.0, 114929.0, 4470.0, 823.0, 378.0, 207.0, 108.0, 86.0, 55.0, 27.0, 25.0, 18.0, 13.0, 17.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.40625, -47.172607421875, -45.93896484375, -44.705322265625, -43.4716796875, -42.238037109375, -41.00439453125, -39.770751953125, -38.537109375, -37.303466796875, -36.06982421875, -34.836181640625, -33.6025390625, -32.368896484375, -31.13525390625, -29.901611328125, -28.66796875, -27.434326171875, -26.20068359375, -24.967041015625, -23.7333984375, -22.499755859375, -21.26611328125, -20.032470703125, -18.798828125, -17.565185546875, -16.33154296875, -15.097900390625, -13.8642578125, -12.630615234375, -11.39697265625, -10.163330078125, -8.9296875, -7.696044921875, -6.46240234375, -5.228759765625, -3.9951171875, -2.761474609375, -1.52783203125, -0.294189453125, 0.939453125, 2.173095703125, 3.40673828125, 4.640380859375, 5.8740234375, 7.107666015625, 8.34130859375, 9.574951171875, 10.80859375, 12.042236328125, 13.27587890625, 14.509521484375, 15.7431640625, 16.976806640625, 18.21044921875, 19.444091796875, 20.677734375, 21.911376953125, 23.14501953125, 24.378662109375, 25.6123046875, 26.845947265625, 28.07958984375, 29.313232421875, 30.546875]}, "gradients/decoder.model.decoder.layers.5.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 2.0, 4.0, 10.0, 11.0, 5.0, 10.0, 14.0, 18.0, 26.0, 25.0, 31.0, 39.0, 41.0, 54.0, 49.0, 52.0, 59.0, 60.0, 45.0, 52.0, 53.0, 48.0, 47.0, 36.0, 34.0, 24.0, 30.0, 29.0, 25.0, 18.0, 14.0, 6.0, 6.0, 3.0, 7.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.046875, -15.5263671875, -15.005859375, -14.4853515625, -13.96484375, -13.4443359375, -12.923828125, -12.4033203125, -11.8828125, -11.3623046875, -10.841796875, -10.3212890625, -9.80078125, -9.2802734375, -8.759765625, -8.2392578125, -7.71875, -7.1982421875, -6.677734375, -6.1572265625, -5.63671875, -5.1162109375, -4.595703125, -4.0751953125, -3.5546875, -3.0341796875, -2.513671875, -1.9931640625, -1.47265625, -0.9521484375, -0.431640625, 0.0888671875, 0.609375, 1.1298828125, 1.650390625, 2.1708984375, 2.69140625, 3.2119140625, 3.732421875, 4.2529296875, 4.7734375, 5.2939453125, 5.814453125, 6.3349609375, 6.85546875, 7.3759765625, 7.896484375, 8.4169921875, 8.9375, 9.4580078125, 9.978515625, 10.4990234375, 11.01953125, 11.5400390625, 12.060546875, 12.5810546875, 13.1015625, 13.6220703125, 14.142578125, 14.6630859375, 15.18359375, 15.7041015625, 16.224609375, 16.7451171875, 17.265625]}, "gradients/decoder.model.decoder.layers.5.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 9.0, 6.0, 10.0, 12.0, 23.0, 36.0, 76.0, 123.0, 236.0, 445.0, 829.0, 1940.0, 6460.0, 45636.0, 941931.0, 3009107.0, 166877.0, 14770.0, 3256.0, 1219.0, 596.0, 283.0, 163.0, 71.0, 47.0, 49.0, 23.0, 20.0, 7.0, 4.0, 6.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.15625, -21.3984375, -20.640625, -19.8828125, -19.125, -18.3671875, -17.609375, -16.8515625, -16.09375, -15.3359375, -14.578125, -13.8203125, -13.0625, -12.3046875, -11.546875, -10.7890625, -10.03125, -9.2734375, -8.515625, -7.7578125, -7.0, -6.2421875, -5.484375, -4.7265625, -3.96875, -3.2109375, -2.453125, -1.6953125, -0.9375, -0.1796875, 0.578125, 1.3359375, 2.09375, 2.8515625, 3.609375, 4.3671875, 5.125, 5.8828125, 6.640625, 7.3984375, 8.15625, 8.9140625, 9.671875, 10.4296875, 11.1875, 11.9453125, 12.703125, 13.4609375, 14.21875, 14.9765625, 15.734375, 16.4921875, 17.25, 18.0078125, 18.765625, 19.5234375, 20.28125, 21.0390625, 21.796875, 22.5546875, 23.3125, 24.0703125, 24.828125, 25.5859375, 26.34375]}, "gradients/decoder.model.decoder.layers.5.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 9.0, 11.0, 5.0, 17.0, 35.0, 42.0, 90.0, 129.0, 184.0, 308.0, 460.0, 588.0, 667.0, 519.0, 367.0, 225.0, 158.0, 96.0, 64.0, 48.0, 22.0, 11.0, 4.0, 8.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.84765625, -7.603515625, -7.359375, -7.115234375, -6.87109375, -6.626953125, -6.3828125, -6.138671875, -5.89453125, -5.650390625, -5.40625, -5.162109375, -4.91796875, -4.673828125, -4.4296875, -4.185546875, -3.94140625, -3.697265625, -3.453125, -3.208984375, -2.96484375, -2.720703125, -2.4765625, -2.232421875, -1.98828125, -1.744140625, -1.5, -1.255859375, -1.01171875, -0.767578125, -0.5234375, -0.279296875, -0.03515625, 0.208984375, 0.453125, 0.697265625, 0.94140625, 1.185546875, 1.4296875, 1.673828125, 1.91796875, 2.162109375, 2.40625, 2.650390625, 2.89453125, 3.138671875, 3.3828125, 3.626953125, 3.87109375, 4.115234375, 4.359375, 4.603515625, 4.84765625, 5.091796875, 5.3359375, 5.580078125, 5.82421875, 6.068359375, 6.3125, 6.556640625, 6.80078125, 7.044921875, 7.2890625, 7.533203125, 7.77734375]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 7.0, 6.0, 4.0, 7.0, 13.0, 17.0, 34.0, 51.0, 56.0, 64.0, 77.0, 95.0, 89.0, 114.0, 104.0, 83.0, 62.0, 39.0, 36.0, 15.0, 15.0, 10.0, 6.0, 2.0, 1.0, 1.0, 4.0], "bins": [-39.11771011352539, -38.32426834106445, -37.53082275390625, -36.73738098144531, -35.943939208984375, -35.15049743652344, -34.357051849365234, -33.5636100769043, -32.77016830444336, -31.97672462463379, -31.18328285217285, -30.38983917236328, -29.596397399902344, -28.802953720092773, -28.009510040283203, -27.216068267822266, -26.422624588012695, -25.629180908203125, -24.835739135742188, -24.042295455932617, -23.24885368347168, -22.45541000366211, -21.661968231201172, -20.8685245513916, -20.07508087158203, -19.28163719177246, -18.488195419311523, -17.694751739501953, -16.901309967041016, -16.107866287231445, -15.314423561096191, -14.520980834960938, -13.727537155151367, -12.934094429016113, -12.14065170288086, -11.347208023071289, -10.553766250610352, -9.760322570800781, -8.966879844665527, -8.173437118530273, -7.3799943923950195, -6.586551666259766, -5.793108940124512, -4.9996657371521, -4.206223011016846, -3.412780284881592, -2.6193370819091797, -1.8258943557739258, -1.0324516296386719, -0.23900878429412842, 0.554434061050415, 1.347877025604248, 2.141319751739502, 2.934762477874756, 3.728205680847168, 4.521648406982422, 5.315091133117676, 6.10853385925293, 6.901976585388184, 7.695419788360596, 8.488862991333008, 9.282304763793945, 10.075748443603516, 10.86919116973877, 11.662633895874023]}, "gradients/decoder.model.decoder.layers.5.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 5.0, 4.0, 6.0, 7.0, 7.0, 17.0, 10.0, 23.0, 24.0, 24.0, 21.0, 18.0, 43.0, 22.0, 43.0, 41.0, 42.0, 44.0, 53.0, 34.0, 41.0, 39.0, 37.0, 44.0, 42.0, 38.0, 41.0, 31.0, 27.0, 26.0, 21.0, 22.0, 20.0, 18.0, 13.0, 6.0, 9.0, 10.0, 6.0, 5.0, 6.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.42003345489502, -12.939018249511719, -12.458003044128418, -11.976987838745117, -11.495973587036133, -11.014957427978516, -10.533943176269531, -10.05292797088623, -9.57191276550293, -9.090897560119629, -8.609882354736328, -8.128867149353027, -7.647852420806885, -7.166837215423584, -6.685822486877441, -6.204807281494141, -5.72379207611084, -5.242776870727539, -4.761761665344238, -4.280746936798096, -3.799731731414795, -3.318716526031494, -2.8377015590667725, -2.356686592102051, -1.87567138671875, -1.3946563005447388, -0.9136412143707275, -0.4326261281967163, 0.04838895797729492, 0.5294041633605957, 1.0104191303253174, 1.491434097290039, 1.9724483489990234, 2.453463554382324, 2.934478521347046, 3.4154934883117676, 3.8965086936950684, 4.377523899078369, 4.858538627624512, 5.3395538330078125, 5.820569038391113, 6.301584243774414, 6.782599449157715, 7.263614177703857, 7.744629383087158, 8.225645065307617, 8.706659317016602, 9.187674522399902, 9.668689727783203, 10.149704933166504, 10.630720138549805, 11.111735343933105, 11.592750549316406, 12.07376480102539, 12.554780006408691, 13.035795211791992, 13.516810417175293, 13.997825622558594, 14.478840827941895, 14.959856033325195, 15.44087028503418, 15.921886444091797, 16.40290069580078, 16.883914947509766, 17.364931106567383]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 8.0, 7.0, 8.0, 11.0, 11.0, 13.0, 25.0, 29.0, 43.0, 79.0, 114.0, 177.0, 308.0, 495.0, 865.0, 1537.0, 2913.0, 5662.0, 11307.0, 23302.0, 48656.0, 102652.0, 196778.0, 262799.0, 194768.0, 101703.0, 48097.0, 22889.0, 11069.0, 5596.0, 2975.0, 1579.0, 853.0, 483.0, 269.0, 185.0, 96.0, 63.0, 32.0, 27.0, 26.0, 12.0, 14.0, 4.0, 2.0, 8.0, 5.0, 4.0, 2.0, 2.0, 1.0, 2.0], "bins": [-2.14453125, -2.0841064453125, -2.023681640625, -1.9632568359375, -1.90283203125, -1.8424072265625, -1.781982421875, -1.7215576171875, -1.6611328125, -1.6007080078125, -1.540283203125, -1.4798583984375, -1.41943359375, -1.3590087890625, -1.298583984375, -1.2381591796875, -1.177734375, -1.1173095703125, -1.056884765625, -0.9964599609375, -0.93603515625, -0.8756103515625, -0.815185546875, -0.7547607421875, -0.6943359375, -0.6339111328125, -0.573486328125, -0.5130615234375, -0.45263671875, -0.3922119140625, -0.331787109375, -0.2713623046875, -0.2109375, -0.1505126953125, -0.090087890625, -0.0296630859375, 0.03076171875, 0.0911865234375, 0.151611328125, 0.2120361328125, 0.2724609375, 0.3328857421875, 0.393310546875, 0.4537353515625, 0.51416015625, 0.5745849609375, 0.635009765625, 0.6954345703125, 0.755859375, 0.8162841796875, 0.876708984375, 0.9371337890625, 0.99755859375, 1.0579833984375, 1.118408203125, 1.1788330078125, 1.2392578125, 1.2996826171875, 1.360107421875, 1.4205322265625, 1.48095703125, 1.5413818359375, 1.601806640625, 1.6622314453125, 1.72265625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 5.0, 0.0, 1.0, 1.0, 9.0, 3.0, 5.0, 8.0, 12.0, 15.0, 26.0, 14.0, 29.0, 29.0, 32.0, 38.0, 42.0, 55.0, 54.0, 63.0, 44.0, 55.0, 45.0, 50.0, 50.0, 41.0, 54.0, 39.0, 33.0, 31.0, 19.0, 25.0, 19.0, 14.0, 8.0, 10.0, 7.0, 6.0, 7.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3125, -9.92431640625, -9.5361328125, -9.14794921875, -8.759765625, -8.37158203125, -7.9833984375, -7.59521484375, -7.20703125, -6.81884765625, -6.4306640625, -6.04248046875, -5.654296875, -5.26611328125, -4.8779296875, -4.48974609375, -4.1015625, -3.71337890625, -3.3251953125, -2.93701171875, -2.548828125, -2.16064453125, -1.7724609375, -1.38427734375, -0.99609375, -0.60791015625, -0.2197265625, 0.16845703125, 0.556640625, 0.94482421875, 1.3330078125, 1.72119140625, 2.109375, 2.49755859375, 2.8857421875, 3.27392578125, 3.662109375, 4.05029296875, 4.4384765625, 4.82666015625, 5.21484375, 5.60302734375, 5.9912109375, 6.37939453125, 6.767578125, 7.15576171875, 7.5439453125, 7.93212890625, 8.3203125, 8.70849609375, 9.0966796875, 9.48486328125, 9.873046875, 10.26123046875, 10.6494140625, 11.03759765625, 11.42578125, 11.81396484375, 12.2021484375, 12.59033203125, 12.978515625, 13.36669921875, 13.7548828125, 14.14306640625, 14.53125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 7.0, 8.0, 6.0, 16.0, 18.0, 28.0, 46.0, 67.0, 83.0, 108.0, 187.0, 318.0, 478.0, 770.0, 1242.0, 1938.0, 3168.0, 5278.0, 9051.0, 15336.0, 27081.0, 48028.0, 84719.0, 142115.0, 198952.0, 193477.0, 132693.0, 78576.0, 44324.0, 24948.0, 14359.0, 8291.0, 4972.0, 2975.0, 1845.0, 1096.0, 709.0, 440.0, 257.0, 179.0, 117.0, 82.0, 58.0, 28.0, 20.0, 23.0, 11.0, 14.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 1.0], "bins": [-1.4033203125, -1.359375, -1.3154296875, -1.271484375, -1.2275390625, -1.18359375, -1.1396484375, -1.095703125, -1.0517578125, -1.0078125, -0.9638671875, -0.919921875, -0.8759765625, -0.83203125, -0.7880859375, -0.744140625, -0.7001953125, -0.65625, -0.6123046875, -0.568359375, -0.5244140625, -0.48046875, -0.4365234375, -0.392578125, -0.3486328125, -0.3046875, -0.2607421875, -0.216796875, -0.1728515625, -0.12890625, -0.0849609375, -0.041015625, 0.0029296875, 0.046875, 0.0908203125, 0.134765625, 0.1787109375, 0.22265625, 0.2666015625, 0.310546875, 0.3544921875, 0.3984375, 0.4423828125, 0.486328125, 0.5302734375, 0.57421875, 0.6181640625, 0.662109375, 0.7060546875, 0.75, 0.7939453125, 0.837890625, 0.8818359375, 0.92578125, 0.9697265625, 1.013671875, 1.0576171875, 1.1015625, 1.1455078125, 1.189453125, 1.2333984375, 1.27734375, 1.3212890625, 1.365234375, 1.4091796875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 2.0, 7.0, 8.0, 8.0, 8.0, 7.0, 7.0, 10.0, 15.0, 14.0, 18.0, 26.0, 17.0, 28.0, 29.0, 35.0, 35.0, 46.0, 41.0, 46.0, 51.0, 32.0, 49.0, 45.0, 56.0, 37.0, 37.0, 34.0, 46.0, 28.0, 25.0, 23.0, 14.0, 23.0, 18.0, 8.0, 14.0, 14.0, 5.0, 14.0, 5.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-24.046875, -23.297607421875, -22.54833984375, -21.799072265625, -21.0498046875, -20.300537109375, -19.55126953125, -18.802001953125, -18.052734375, -17.303466796875, -16.55419921875, -15.804931640625, -15.0556640625, -14.306396484375, -13.55712890625, -12.807861328125, -12.05859375, -11.309326171875, -10.56005859375, -9.810791015625, -9.0615234375, -8.312255859375, -7.56298828125, -6.813720703125, -6.064453125, -5.315185546875, -4.56591796875, -3.816650390625, -3.0673828125, -2.318115234375, -1.56884765625, -0.819580078125, -0.0703125, 0.678955078125, 1.42822265625, 2.177490234375, 2.9267578125, 3.676025390625, 4.42529296875, 5.174560546875, 5.923828125, 6.673095703125, 7.42236328125, 8.171630859375, 8.9208984375, 9.670166015625, 10.41943359375, 11.168701171875, 11.91796875, 12.667236328125, 13.41650390625, 14.165771484375, 14.9150390625, 15.664306640625, 16.41357421875, 17.162841796875, 17.912109375, 18.661376953125, 19.41064453125, 20.159912109375, 20.9091796875, 21.658447265625, 22.40771484375, 23.156982421875, 23.90625]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 5.0, 8.0, 7.0, 7.0, 12.0, 22.0, 18.0, 24.0, 44.0, 51.0, 62.0, 90.0, 122.0, 170.0, 256.0, 415.0, 650.0, 1209.0, 2217.0, 4554.0, 11784.0, 37466.0, 144059.0, 486328.0, 262273.0, 65210.0, 18181.0, 6583.0, 2825.0, 1494.0, 837.0, 526.0, 299.0, 220.0, 136.0, 113.0, 78.0, 53.0, 31.0, 31.0, 16.0, 23.0, 16.0, 10.0, 7.0, 4.0, 7.0, 3.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.335693359375, -0.32439422607421875, -0.3130950927734375, -0.30179595947265625, -0.290496826171875, -0.27919769287109375, -0.2678985595703125, -0.25659942626953125, -0.24530029296875, -0.23400115966796875, -0.2227020263671875, -0.21140289306640625, -0.200103759765625, -0.18880462646484375, -0.1775054931640625, -0.16620635986328125, -0.1549072265625, -0.14360809326171875, -0.1323089599609375, -0.12100982666015625, -0.109710693359375, -0.09841156005859375, -0.0871124267578125, -0.07581329345703125, -0.06451416015625, -0.05321502685546875, -0.0419158935546875, -0.03061676025390625, -0.019317626953125, -0.00801849365234375, 0.0032806396484375, 0.01457977294921875, 0.02587890625, 0.03717803955078125, 0.0484771728515625, 0.05977630615234375, 0.071075439453125, 0.08237457275390625, 0.0936737060546875, 0.10497283935546875, 0.11627197265625, 0.12757110595703125, 0.1388702392578125, 0.15016937255859375, 0.161468505859375, 0.17276763916015625, 0.1840667724609375, 0.19536590576171875, 0.2066650390625, 0.21796417236328125, 0.2292633056640625, 0.24056243896484375, 0.251861572265625, 0.26316070556640625, 0.2744598388671875, 0.28575897216796875, 0.29705810546875, 0.30835723876953125, 0.3196563720703125, 0.33095550537109375, 0.342254638671875, 0.35355377197265625, 0.3648529052734375, 0.37615203857421875, 0.387451171875]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 3.0, 8.0, 13.0, 17.0, 21.0, 31.0, 32.0, 70.0, 83.0, 77.0, 94.0, 113.0, 104.0, 79.0, 71.0, 43.0, 40.0, 19.0, 15.0, 15.0, 17.0, 6.0, 8.0, 3.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00023055076599121094, -0.00022336095571517944, -0.00021617114543914795, -0.00020898133516311646, -0.00020179152488708496, -0.00019460171461105347, -0.00018741190433502197, -0.00018022209405899048, -0.00017303228378295898, -0.0001658424735069275, -0.000158652663230896, -0.0001514628529548645, -0.000144273042678833, -0.00013708323240280151, -0.00012989342212677002, -0.00012270361185073853, -0.00011551380157470703, -0.00010832399129867554, -0.00010113418102264404, -9.394437074661255e-05, -8.675456047058105e-05, -7.956475019454956e-05, -7.237493991851807e-05, -6.518512964248657e-05, -5.799531936645508e-05, -5.0805509090423584e-05, -4.361569881439209e-05, -3.6425888538360596e-05, -2.92360782623291e-05, -2.2046267986297607e-05, -1.4856457710266113e-05, -7.666647434234619e-06, -4.76837158203125e-07, 6.712973117828369e-06, 1.3902783393859863e-05, 2.1092593669891357e-05, 2.828240394592285e-05, 3.5472214221954346e-05, 4.266202449798584e-05, 4.9851834774017334e-05, 5.704164505004883e-05, 6.423145532608032e-05, 7.142126560211182e-05, 7.861107587814331e-05, 8.58008861541748e-05, 9.29906964302063e-05, 0.00010018050670623779, 0.00010737031698226929, 0.00011456012725830078, 0.00012174993753433228, 0.00012893974781036377, 0.00013612955808639526, 0.00014331936836242676, 0.00015050917863845825, 0.00015769898891448975, 0.00016488879919052124, 0.00017207860946655273, 0.00017926841974258423, 0.00018645823001861572, 0.00019364804029464722, 0.0002008378505706787, 0.0002080276608467102, 0.0002152174711227417, 0.0002224072813987732, 0.0002295970916748047]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 5.0, 2.0, 1.0, 5.0, 14.0, 16.0, 20.0, 37.0, 61.0, 97.0, 154.0, 313.0, 703.0, 2061.0, 6825.0, 31663.0, 205864.0, 621071.0, 147388.0, 23938.0, 5387.0, 1696.0, 631.0, 268.0, 136.0, 84.0, 41.0, 23.0, 15.0, 11.0, 14.0, 7.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.47802734375, -0.46327972412109375, -0.4485321044921875, -0.43378448486328125, -0.419036865234375, -0.40428924560546875, -0.3895416259765625, -0.37479400634765625, -0.36004638671875, -0.34529876708984375, -0.3305511474609375, -0.31580352783203125, -0.301055908203125, -0.28630828857421875, -0.2715606689453125, -0.25681304931640625, -0.2420654296875, -0.22731781005859375, -0.2125701904296875, -0.19782257080078125, -0.183074951171875, -0.16832733154296875, -0.1535797119140625, -0.13883209228515625, -0.12408447265625, -0.10933685302734375, -0.0945892333984375, -0.07984161376953125, -0.065093994140625, -0.05034637451171875, -0.0355987548828125, -0.02085113525390625, -0.006103515625, 0.00864410400390625, 0.0233917236328125, 0.03813934326171875, 0.052886962890625, 0.06763458251953125, 0.0823822021484375, 0.09712982177734375, 0.11187744140625, 0.12662506103515625, 0.1413726806640625, 0.15612030029296875, 0.170867919921875, 0.18561553955078125, 0.2003631591796875, 0.21511077880859375, 0.2298583984375, 0.24460601806640625, 0.2593536376953125, 0.27410125732421875, 0.288848876953125, 0.30359649658203125, 0.3183441162109375, 0.33309173583984375, 0.34783935546875, 0.36258697509765625, 0.3773345947265625, 0.39208221435546875, 0.406829833984375, 0.42157745361328125, 0.4363250732421875, 0.45107269287109375, 0.4658203125]}, "gradients/decoder.model.decoder.layers.5.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 5.0, 6.0, 16.0, 17.0, 23.0, 32.0, 47.0, 62.0, 102.0, 100.0, 110.0, 97.0, 98.0, 83.0, 58.0, 43.0, 28.0, 16.0, 12.0, 12.0, 9.0, 6.0, 7.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.13916015625, -0.13446807861328125, -0.1297760009765625, -0.12508392333984375, -0.120391845703125, -0.11569976806640625, -0.1110076904296875, -0.10631561279296875, -0.10162353515625, -0.09693145751953125, -0.0922393798828125, -0.08754730224609375, -0.082855224609375, -0.07816314697265625, -0.0734710693359375, -0.06877899169921875, -0.0640869140625, -0.05939483642578125, -0.0547027587890625, -0.05001068115234375, -0.045318603515625, -0.04062652587890625, -0.0359344482421875, -0.03124237060546875, -0.02655029296875, -0.02185821533203125, -0.0171661376953125, -0.01247406005859375, -0.007781982421875, -0.00308990478515625, 0.0016021728515625, 0.00629425048828125, 0.010986328125, 0.01567840576171875, 0.0203704833984375, 0.02506256103515625, 0.029754638671875, 0.03444671630859375, 0.0391387939453125, 0.04383087158203125, 0.04852294921875, 0.05321502685546875, 0.0579071044921875, 0.06259918212890625, 0.067291259765625, 0.07198333740234375, 0.0766754150390625, 0.08136749267578125, 0.0860595703125, 0.09075164794921875, 0.0954437255859375, 0.10013580322265625, 0.104827880859375, 0.10951995849609375, 0.1142120361328125, 0.11890411376953125, 0.12359619140625, 0.12828826904296875, 0.1329803466796875, 0.13767242431640625, 0.142364501953125, 0.14705657958984375, 0.1517486572265625, 0.15644073486328125, 0.1611328125]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 12.0, 10.0, 34.0, 120.0, 215.0, 301.0, 199.0, 92.0, 23.0, 6.0, 5.0], "bins": [-76.26402282714844, -74.95537567138672, -73.646728515625, -72.33808135986328, -71.02943420410156, -69.72077941894531, -68.4121322631836, -67.10348510742188, -65.79483795166016, -64.48619079589844, -63.17754364013672, -61.868892669677734, -60.560245513916016, -59.2515983581543, -57.94294738769531, -56.634300231933594, -55.325653076171875, -54.017005920410156, -52.70835876464844, -51.39970779418945, -50.091060638427734, -48.782413482666016, -47.47376251220703, -46.16511535644531, -44.856468200683594, -43.547821044921875, -42.239173889160156, -40.93052291870117, -39.62187576293945, -38.313228607177734, -37.00457763671875, -35.69593048095703, -34.38728332519531, -33.078636169433594, -31.769987106323242, -30.46133804321289, -29.152690887451172, -27.844043731689453, -26.5353946685791, -25.22674560546875, -23.91809844970703, -22.609451293945312, -21.30080223083496, -19.99215316772461, -18.68350601196289, -17.374858856201172, -16.06620979309082, -14.757561683654785, -13.448912620544434, -12.140264511108398, -10.831616401672363, -9.522968292236328, -8.214320182800293, -6.905672073364258, -5.597023963928223, -4.2883758544921875, -2.9797277450561523, -1.6710796356201172, -0.36243152618408203, 0.9462165832519531, 2.2548646926879883, 3.5635128021240234, 4.872160911560059, 6.180809020996094, 7.489457130432129]}, "gradients/decoder.model.decoder.layers.5.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 3.0, 12.0, 7.0, 5.0, 11.0, 16.0, 23.0, 27.0, 25.0, 22.0, 34.0, 36.0, 50.0, 46.0, 49.0, 56.0, 49.0, 58.0, 37.0, 38.0, 64.0, 40.0, 46.0, 36.0, 37.0, 22.0, 29.0, 24.0, 20.0, 15.0, 11.0, 13.0, 8.0, 6.0, 7.0, 5.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.320796012878418, -9.961040496826172, -9.60128402709961, -9.241528511047363, -8.881772994995117, -8.522017478942871, -8.162261962890625, -7.8025054931640625, -7.442749977111816, -7.08299446105957, -6.723238468170166, -6.363482475280762, -6.003726959228516, -5.6439714431762695, -5.284215450286865, -4.924459457397461, -4.564703941345215, -4.204948425292969, -3.8451924324035645, -3.4854366779327393, -3.125680923461914, -2.765925168991089, -2.4061694145202637, -2.0464136600494385, -1.6866579055786133, -1.326902151107788, -0.9671463966369629, -0.6073906421661377, -0.2476348876953125, 0.1121208667755127, 0.4718766212463379, 0.8316323757171631, 1.1913881301879883, 1.5511438846588135, 1.9108996391296387, 2.270655393600464, 2.630411148071289, 2.9901669025421143, 3.3499226570129395, 3.7096784114837646, 4.06943416595459, 4.429189682006836, 4.78894567489624, 5.1487016677856445, 5.508457183837891, 5.868212699890137, 6.227968692779541, 6.587724685668945, 6.947480201721191, 7.3072357177734375, 7.666991710662842, 8.026747703552246, 8.386503219604492, 8.746258735656738, 9.106014251708984, 9.465770721435547, 9.825526237487793, 10.185281753540039, 10.545038223266602, 10.904793739318848, 11.264549255371094, 11.62430477142334, 11.984060287475586, 12.343816757202148, 12.703572273254395]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 4.0, 3.0, 4.0, 14.0, 7.0, 12.0, 10.0, 15.0, 27.0, 29.0, 39.0, 67.0, 89.0, 142.0, 199.0, 337.0, 582.0, 1049.0, 1977.0, 3752.0, 7606.0, 15461.0, 33087.0, 72916.0, 161742.0, 281312.0, 243786.0, 121056.0, 54097.0, 24794.0, 11785.0, 5794.0, 3025.0, 1577.0, 850.0, 479.0, 279.0, 184.0, 110.0, 81.0, 48.0, 35.0, 25.0, 16.0, 18.0, 10.0, 5.0, 9.0, 7.0, 1.0, 5.0, 0.0, 2.0, 1.0, 2.0, 2.0], "bins": [-7.5, -7.2781982421875, -7.056396484375, -6.8345947265625, -6.61279296875, -6.3909912109375, -6.169189453125, -5.9473876953125, -5.7255859375, -5.5037841796875, -5.281982421875, -5.0601806640625, -4.83837890625, -4.6165771484375, -4.394775390625, -4.1729736328125, -3.951171875, -3.7293701171875, -3.507568359375, -3.2857666015625, -3.06396484375, -2.8421630859375, -2.620361328125, -2.3985595703125, -2.1767578125, -1.9549560546875, -1.733154296875, -1.5113525390625, -1.28955078125, -1.0677490234375, -0.845947265625, -0.6241455078125, -0.40234375, -0.1805419921875, 0.041259765625, 0.2630615234375, 0.48486328125, 0.7066650390625, 0.928466796875, 1.1502685546875, 1.3720703125, 1.5938720703125, 1.815673828125, 2.0374755859375, 2.25927734375, 2.4810791015625, 2.702880859375, 2.9246826171875, 3.146484375, 3.3682861328125, 3.590087890625, 3.8118896484375, 4.03369140625, 4.2554931640625, 4.477294921875, 4.6990966796875, 4.9208984375, 5.1427001953125, 5.364501953125, 5.5863037109375, 5.80810546875, 6.0299072265625, 6.251708984375, 6.4735107421875, 6.6953125]}, "gradients/decoder.model.decoder.layers.5.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 5.0, 4.0, 3.0, 3.0, 9.0, 9.0, 8.0, 14.0, 15.0, 20.0, 19.0, 31.0, 29.0, 41.0, 48.0, 41.0, 37.0, 43.0, 51.0, 48.0, 43.0, 36.0, 38.0, 47.0, 53.0, 42.0, 35.0, 30.0, 34.0, 26.0, 34.0, 20.0, 17.0, 8.0, 18.0, 13.0, 7.0, 6.0, 6.0, 3.0, 5.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.828125, -21.181396484375, -20.53466796875, -19.887939453125, -19.2412109375, -18.594482421875, -17.94775390625, -17.301025390625, -16.654296875, -16.007568359375, -15.36083984375, -14.714111328125, -14.0673828125, -13.420654296875, -12.77392578125, -12.127197265625, -11.48046875, -10.833740234375, -10.18701171875, -9.540283203125, -8.8935546875, -8.246826171875, -7.60009765625, -6.953369140625, -6.306640625, -5.659912109375, -5.01318359375, -4.366455078125, -3.7197265625, -3.072998046875, -2.42626953125, -1.779541015625, -1.1328125, -0.486083984375, 0.16064453125, 0.807373046875, 1.4541015625, 2.100830078125, 2.74755859375, 3.394287109375, 4.041015625, 4.687744140625, 5.33447265625, 5.981201171875, 6.6279296875, 7.274658203125, 7.92138671875, 8.568115234375, 9.21484375, 9.861572265625, 10.50830078125, 11.155029296875, 11.8017578125, 12.448486328125, 13.09521484375, 13.741943359375, 14.388671875, 15.035400390625, 15.68212890625, 16.328857421875, 16.9755859375, 17.622314453125, 18.26904296875, 18.915771484375, 19.5625]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 8.0, 6.0, 8.0, 5.0, 8.0, 9.0, 22.0, 25.0, 31.0, 31.0, 63.0, 62.0, 86.0, 140.0, 210.0, 395.0, 844.0, 6026.0, 123856.0, 829083.0, 81589.0, 4278.0, 743.0, 315.0, 222.0, 115.0, 88.0, 64.0, 59.0, 23.0, 26.0, 21.0, 11.0, 17.0, 14.0, 12.0, 6.0, 4.0, 8.0, 9.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.03125, -25.176025390625, -24.32080078125, -23.465576171875, -22.6103515625, -21.755126953125, -20.89990234375, -20.044677734375, -19.189453125, -18.334228515625, -17.47900390625, -16.623779296875, -15.7685546875, -14.913330078125, -14.05810546875, -13.202880859375, -12.34765625, -11.492431640625, -10.63720703125, -9.781982421875, -8.9267578125, -8.071533203125, -7.21630859375, -6.361083984375, -5.505859375, -4.650634765625, -3.79541015625, -2.940185546875, -2.0849609375, -1.229736328125, -0.37451171875, 0.480712890625, 1.3359375, 2.191162109375, 3.04638671875, 3.901611328125, 4.7568359375, 5.612060546875, 6.46728515625, 7.322509765625, 8.177734375, 9.032958984375, 9.88818359375, 10.743408203125, 11.5986328125, 12.453857421875, 13.30908203125, 14.164306640625, 15.01953125, 15.874755859375, 16.72998046875, 17.585205078125, 18.4404296875, 19.295654296875, 20.15087890625, 21.006103515625, 21.861328125, 22.716552734375, 23.57177734375, 24.427001953125, 25.2822265625, 26.137451171875, 26.99267578125, 27.847900390625, 28.703125]}, "gradients/decoder.model.decoder.layers.5.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 12.0, 5.0, 8.0, 13.0, 18.0, 21.0, 21.0, 18.0, 30.0, 24.0, 26.0, 34.0, 45.0, 42.0, 41.0, 59.0, 43.0, 49.0, 48.0, 44.0, 41.0, 45.0, 46.0, 34.0, 32.0, 30.0, 16.0, 31.0, 23.0, 18.0, 10.0, 18.0, 11.0, 4.0, 9.0, 5.0, 6.0, 3.0, 4.0, 1.0, 6.0, 0.0, 2.0, 1.0, 2.0], "bins": [-30.203125, -29.376708984375, -28.55029296875, -27.723876953125, -26.8974609375, -26.071044921875, -25.24462890625, -24.418212890625, -23.591796875, -22.765380859375, -21.93896484375, -21.112548828125, -20.2861328125, -19.459716796875, -18.63330078125, -17.806884765625, -16.98046875, -16.154052734375, -15.32763671875, -14.501220703125, -13.6748046875, -12.848388671875, -12.02197265625, -11.195556640625, -10.369140625, -9.542724609375, -8.71630859375, -7.889892578125, -7.0634765625, -6.237060546875, -5.41064453125, -4.584228515625, -3.7578125, -2.931396484375, -2.10498046875, -1.278564453125, -0.4521484375, 0.374267578125, 1.20068359375, 2.027099609375, 2.853515625, 3.679931640625, 4.50634765625, 5.332763671875, 6.1591796875, 6.985595703125, 7.81201171875, 8.638427734375, 9.46484375, 10.291259765625, 11.11767578125, 11.944091796875, 12.7705078125, 13.596923828125, 14.42333984375, 15.249755859375, 16.076171875, 16.902587890625, 17.72900390625, 18.555419921875, 19.3818359375, 20.208251953125, 21.03466796875, 21.861083984375, 22.6875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 3.0, 4.0, 13.0, 12.0, 28.0, 41.0, 81.0, 215.0, 546.0, 1500.0, 4763.0, 51814.0, 945046.0, 37838.0, 4426.0, 1357.0, 498.0, 181.0, 77.0, 41.0, 20.0, 15.0, 14.0, 8.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.3984375, -10.9324951171875, -10.466552734375, -10.0006103515625, -9.53466796875, -9.0687255859375, -8.602783203125, -8.1368408203125, -7.6708984375, -7.2049560546875, -6.739013671875, -6.2730712890625, -5.80712890625, -5.3411865234375, -4.875244140625, -4.4093017578125, -3.943359375, -3.4774169921875, -3.011474609375, -2.5455322265625, -2.07958984375, -1.6136474609375, -1.147705078125, -0.6817626953125, -0.2158203125, 0.2501220703125, 0.716064453125, 1.1820068359375, 1.64794921875, 2.1138916015625, 2.579833984375, 3.0457763671875, 3.51171875, 3.9776611328125, 4.443603515625, 4.9095458984375, 5.37548828125, 5.8414306640625, 6.307373046875, 6.7733154296875, 7.2392578125, 7.7052001953125, 8.171142578125, 8.6370849609375, 9.10302734375, 9.5689697265625, 10.034912109375, 10.5008544921875, 10.966796875, 11.4327392578125, 11.898681640625, 12.3646240234375, 12.83056640625, 13.2965087890625, 13.762451171875, 14.2283935546875, 14.6943359375, 15.1602783203125, 15.626220703125, 16.0921630859375, 16.55810546875, 17.0240478515625, 17.489990234375, 17.9559326171875, 18.421875]}, "gradients/decoder.model.decoder.layers.5.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 9.0, 10.0, 21.0, 36.0, 71.0, 124.0, 176.0, 247.0, 154.0, 78.0, 43.0, 13.0, 6.0, 4.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016965866088867188, -0.0016341954469680786, -0.0015718042850494385, -0.0015094131231307983, -0.0014470219612121582, -0.001384630799293518, -0.001322239637374878, -0.0012598484754562378, -0.0011974573135375977, -0.0011350661516189575, -0.0010726749897003174, -0.0010102838277816772, -0.0009478926658630371, -0.000885501503944397, -0.0008231103420257568, -0.0007607191801071167, -0.0006983280181884766, -0.0006359368562698364, -0.0005735456943511963, -0.0005111545324325562, -0.000448763370513916, -0.0003863722085952759, -0.00032398104667663574, -0.0002615898847579956, -0.00019919872283935547, -0.00013680756092071533, -7.44163990020752e-05, -1.2025237083435059e-05, 5.036592483520508e-05, 0.00011275708675384521, 0.00017514824867248535, 0.0002375394105911255, 0.0002999305725097656, 0.00036232173442840576, 0.0004247128963470459, 0.00048710405826568604, 0.0005494952201843262, 0.0006118863821029663, 0.0006742775440216064, 0.0007366687059402466, 0.0007990598678588867, 0.0008614510297775269, 0.000923842191696167, 0.0009862333536148071, 0.0010486245155334473, 0.0011110156774520874, 0.0011734068393707275, 0.0012357980012893677, 0.0012981891632080078, 0.001360580325126648, 0.001422971487045288, 0.0014853626489639282, 0.0015477538108825684, 0.0016101449728012085, 0.0016725361347198486, 0.0017349272966384888, 0.001797318458557129, 0.001859709620475769, 0.0019221007823944092, 0.0019844919443130493, 0.0020468831062316895, 0.0021092742681503296, 0.0021716654300689697, 0.00223405659198761, 0.00229644775390625]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 12.0, 12.0, 18.0, 23.0, 46.0, 82.0, 179.0, 454.0, 1190.0, 3929.0, 48256.0, 941677.0, 46758.0, 3900.0, 1157.0, 442.0, 183.0, 107.0, 41.0, 37.0, 26.0, 12.0, 9.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.859375, -11.375244140625, -10.89111328125, -10.406982421875, -9.9228515625, -9.438720703125, -8.95458984375, -8.470458984375, -7.986328125, -7.502197265625, -7.01806640625, -6.533935546875, -6.0498046875, -5.565673828125, -5.08154296875, -4.597412109375, -4.11328125, -3.629150390625, -3.14501953125, -2.660888671875, -2.1767578125, -1.692626953125, -1.20849609375, -0.724365234375, -0.240234375, 0.243896484375, 0.72802734375, 1.212158203125, 1.6962890625, 2.180419921875, 2.66455078125, 3.148681640625, 3.6328125, 4.116943359375, 4.60107421875, 5.085205078125, 5.5693359375, 6.053466796875, 6.53759765625, 7.021728515625, 7.505859375, 7.989990234375, 8.47412109375, 8.958251953125, 9.4423828125, 9.926513671875, 10.41064453125, 10.894775390625, 11.37890625, 11.863037109375, 12.34716796875, 12.831298828125, 13.3154296875, 13.799560546875, 14.28369140625, 14.767822265625, 15.251953125, 15.736083984375, 16.22021484375, 16.704345703125, 17.1884765625, 17.672607421875, 18.15673828125, 18.640869140625, 19.125]}, "gradients/decoder.model.decoder.layers.5.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 8.0, 7.0, 10.0, 21.0, 14.0, 35.0, 31.0, 48.0, 64.0, 73.0, 90.0, 91.0, 110.0, 93.0, 71.0, 55.0, 43.0, 46.0, 23.0, 21.0, 11.0, 16.0, 9.0, 4.0, 1.0, 6.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.42578125, -3.3467559814453125, -3.267730712890625, -3.1887054443359375, -3.10968017578125, -3.0306549072265625, -2.951629638671875, -2.8726043701171875, -2.7935791015625, -2.7145538330078125, -2.635528564453125, -2.5565032958984375, -2.47747802734375, -2.3984527587890625, -2.319427490234375, -2.2404022216796875, -2.161376953125, -2.0823516845703125, -2.003326416015625, -1.9243011474609375, -1.84527587890625, -1.7662506103515625, -1.687225341796875, -1.6082000732421875, -1.5291748046875, -1.4501495361328125, -1.371124267578125, -1.2920989990234375, -1.21307373046875, -1.1340484619140625, -1.055023193359375, -0.9759979248046875, -0.89697265625, -0.8179473876953125, -0.738922119140625, -0.6598968505859375, -0.58087158203125, -0.5018463134765625, -0.422821044921875, -0.3437957763671875, -0.2647705078125, -0.1857452392578125, -0.106719970703125, -0.0276947021484375, 0.05133056640625, 0.1303558349609375, 0.209381103515625, 0.2884063720703125, 0.367431640625, 0.4464569091796875, 0.525482177734375, 0.6045074462890625, 0.68353271484375, 0.7625579833984375, 0.841583251953125, 0.9206085205078125, 0.9996337890625, 1.0786590576171875, 1.157684326171875, 1.2367095947265625, 1.31573486328125, 1.3947601318359375, 1.473785400390625, 1.5528106689453125, 1.6318359375]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 3.0, 8.0, 7.0, 11.0, 20.0, 23.0, 35.0, 46.0, 62.0, 92.0, 103.0, 104.0, 117.0, 93.0, 78.0, 68.0, 41.0, 30.0, 30.0, 15.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.54375648498535, -26.541545867919922, -25.539337158203125, -24.537128448486328, -23.5349178314209, -22.53270721435547, -21.530498504638672, -20.528289794921875, -19.526079177856445, -18.523868560791016, -17.52165985107422, -16.519451141357422, -15.517240524291992, -14.515030860900879, -13.512821197509766, -12.510611534118652, -11.508401870727539, -10.506192207336426, -9.503982543945312, -8.5017728805542, -7.499563217163086, -6.497353553771973, -5.495143890380859, -4.492934226989746, -3.490724563598633, -2.4885149002075195, -1.4863052368164062, -0.48409557342529297, 0.5181140899658203, 1.5203237533569336, 2.522533416748047, 3.52474308013916, 4.526950836181641, 5.529160499572754, 6.531370162963867, 7.5335798263549805, 8.535789489746094, 9.537999153137207, 10.54020881652832, 11.542418479919434, 12.544628143310547, 13.54683780670166, 14.549047470092773, 15.551257133483887, 16.553466796875, 17.555675506591797, 18.557886123657227, 19.560096740722656, 20.562305450439453, 21.56451416015625, 22.56672477722168, 23.56893539428711, 24.571144104003906, 25.573352813720703, 26.575563430786133, 27.577774047851562, 28.57998275756836, 29.582191467285156, 30.584402084350586, 31.586612701416016, 32.58882141113281, 33.59103012084961, 34.593238830566406, 35.59545135498047, 36.597660064697266]}, "gradients/decoder.model.decoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 7.0, 5.0, 5.0, 13.0, 13.0, 4.0, 12.0, 13.0, 17.0, 12.0, 16.0, 13.0, 26.0, 21.0, 16.0, 24.0, 19.0, 34.0, 34.0, 31.0, 36.0, 38.0, 34.0, 24.0, 33.0, 37.0, 38.0, 24.0, 38.0, 30.0, 37.0, 35.0, 30.0, 27.0, 22.0, 25.0, 21.0, 11.0, 19.0, 18.0, 12.0, 11.0, 16.0, 8.0, 12.0, 4.0, 6.0, 8.0, 5.0, 5.0, 2.0, 4.0, 1.0, 1.0, 1.0, 3.0], "bins": [-38.047576904296875, -36.88070297241211, -35.713829040527344, -34.54695129394531, -33.38007736206055, -32.21320343017578, -31.046327590942383, -29.879451751708984, -28.71257781982422, -27.545703887939453, -26.378828048706055, -25.211952209472656, -24.04507827758789, -22.878204345703125, -21.711328506469727, -20.544452667236328, -19.377578735351562, -18.210704803466797, -17.0438289642334, -15.876954078674316, -14.710079193115234, -13.543204307556152, -12.37632942199707, -11.209454536437988, -10.042579650878906, -8.875704765319824, -7.708829879760742, -6.54195499420166, -5.375080108642578, -4.208205223083496, -3.041330337524414, -1.874455451965332, -0.7075843811035156, 0.4592905044555664, 1.6261653900146484, 2.7930402755737305, 3.9599151611328125, 5.1267900466918945, 6.293664932250977, 7.460539817810059, 8.62741470336914, 9.794289588928223, 10.961164474487305, 12.128039360046387, 13.294914245605469, 14.46178913116455, 15.628664016723633, 16.79553985595703, 17.962413787841797, 19.129287719726562, 20.29616355895996, 21.46303939819336, 22.629913330078125, 23.79678726196289, 24.96366310119629, 26.130538940429688, 27.297412872314453, 28.46428680419922, 29.631162643432617, 30.798038482666016, 31.96491241455078, 33.13178634643555, 34.29866027832031, 35.465538024902344, 36.63241195678711]}, "gradients/decoder.model.decoder.layers.4.fc2.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 9.0, 12.0, 16.0, 13.0, 17.0, 36.0, 34.0, 44.0, 69.0, 86.0, 169.0, 248.0, 511.0, 1042.0, 4263.0, 53261.0, 1455016.0, 2551952.0, 118090.0, 6924.0, 1299.0, 466.0, 249.0, 151.0, 78.0, 73.0, 36.0, 23.0, 25.0, 21.0, 12.0, 9.0, 12.0, 9.0, 6.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.53125, -27.5517578125, -26.572265625, -25.5927734375, -24.61328125, -23.6337890625, -22.654296875, -21.6748046875, -20.6953125, -19.7158203125, -18.736328125, -17.7568359375, -16.77734375, -15.7978515625, -14.818359375, -13.8388671875, -12.859375, -11.8798828125, -10.900390625, -9.9208984375, -8.94140625, -7.9619140625, -6.982421875, -6.0029296875, -5.0234375, -4.0439453125, -3.064453125, -2.0849609375, -1.10546875, -0.1259765625, 0.853515625, 1.8330078125, 2.8125, 3.7919921875, 4.771484375, 5.7509765625, 6.73046875, 7.7099609375, 8.689453125, 9.6689453125, 10.6484375, 11.6279296875, 12.607421875, 13.5869140625, 14.56640625, 15.5458984375, 16.525390625, 17.5048828125, 18.484375, 19.4638671875, 20.443359375, 21.4228515625, 22.40234375, 23.3818359375, 24.361328125, 25.3408203125, 26.3203125, 27.2998046875, 28.279296875, 29.2587890625, 30.23828125, 31.2177734375, 32.197265625, 33.1767578125, 34.15625]}, "gradients/decoder.model.decoder.layers.4.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 8.0, 2.0, 8.0, 6.0, 7.0, 12.0, 19.0, 29.0, 36.0, 36.0, 34.0, 58.0, 48.0, 46.0, 69.0, 65.0, 57.0, 56.0, 65.0, 49.0, 45.0, 51.0, 33.0, 36.0, 26.0, 22.0, 25.0, 19.0, 12.0, 6.0, 5.0, 5.0, 4.0, 4.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.953125, -13.40478515625, -12.8564453125, -12.30810546875, -11.759765625, -11.21142578125, -10.6630859375, -10.11474609375, -9.56640625, -9.01806640625, -8.4697265625, -7.92138671875, -7.373046875, -6.82470703125, -6.2763671875, -5.72802734375, -5.1796875, -4.63134765625, -4.0830078125, -3.53466796875, -2.986328125, -2.43798828125, -1.8896484375, -1.34130859375, -0.79296875, -0.24462890625, 0.3037109375, 0.85205078125, 1.400390625, 1.94873046875, 2.4970703125, 3.04541015625, 3.59375, 4.14208984375, 4.6904296875, 5.23876953125, 5.787109375, 6.33544921875, 6.8837890625, 7.43212890625, 7.98046875, 8.52880859375, 9.0771484375, 9.62548828125, 10.173828125, 10.72216796875, 11.2705078125, 11.81884765625, 12.3671875, 12.91552734375, 13.4638671875, 14.01220703125, 14.560546875, 15.10888671875, 15.6572265625, 16.20556640625, 16.75390625, 17.30224609375, 17.8505859375, 18.39892578125, 18.947265625, 19.49560546875, 20.0439453125, 20.59228515625, 21.140625]}, "gradients/decoder.model.decoder.layers.4.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 9.0, 6.0, 13.0, 20.0, 28.0, 37.0, 65.0, 75.0, 169.0, 211.0, 416.0, 936.0, 2196.0, 7599.0, 47396.0, 777284.0, 3095435.0, 234088.0, 20750.0, 4473.0, 1506.0, 715.0, 325.0, 215.0, 113.0, 67.0, 44.0, 28.0, 17.0, 13.0, 7.0, 8.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.984375, -18.313720703125, -17.64306640625, -16.972412109375, -16.3017578125, -15.631103515625, -14.96044921875, -14.289794921875, -13.619140625, -12.948486328125, -12.27783203125, -11.607177734375, -10.9365234375, -10.265869140625, -9.59521484375, -8.924560546875, -8.25390625, -7.583251953125, -6.91259765625, -6.241943359375, -5.5712890625, -4.900634765625, -4.22998046875, -3.559326171875, -2.888671875, -2.218017578125, -1.54736328125, -0.876708984375, -0.2060546875, 0.464599609375, 1.13525390625, 1.805908203125, 2.4765625, 3.147216796875, 3.81787109375, 4.488525390625, 5.1591796875, 5.829833984375, 6.50048828125, 7.171142578125, 7.841796875, 8.512451171875, 9.18310546875, 9.853759765625, 10.5244140625, 11.195068359375, 11.86572265625, 12.536376953125, 13.20703125, 13.877685546875, 14.54833984375, 15.218994140625, 15.8896484375, 16.560302734375, 17.23095703125, 17.901611328125, 18.572265625, 19.242919921875, 19.91357421875, 20.584228515625, 21.2548828125, 21.925537109375, 22.59619140625, 23.266845703125, 23.9375]}, "gradients/decoder.model.decoder.layers.4.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 2.0, 3.0, 10.0, 14.0, 21.0, 29.0, 31.0, 42.0, 44.0, 78.0, 114.0, 140.0, 198.0, 298.0, 323.0, 443.0, 470.0, 444.0, 345.0, 274.0, 202.0, 165.0, 94.0, 76.0, 52.0, 32.0, 38.0, 21.0, 11.0, 9.0, 11.0, 10.0, 7.0, 6.0, 2.0, 3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.53515625, -4.3814697265625, -4.227783203125, -4.0740966796875, -3.92041015625, -3.7667236328125, -3.613037109375, -3.4593505859375, -3.3056640625, -3.1519775390625, -2.998291015625, -2.8446044921875, -2.69091796875, -2.5372314453125, -2.383544921875, -2.2298583984375, -2.076171875, -1.9224853515625, -1.768798828125, -1.6151123046875, -1.46142578125, -1.3077392578125, -1.154052734375, -1.0003662109375, -0.8466796875, -0.6929931640625, -0.539306640625, -0.3856201171875, -0.23193359375, -0.0782470703125, 0.075439453125, 0.2291259765625, 0.3828125, 0.5364990234375, 0.690185546875, 0.8438720703125, 0.99755859375, 1.1512451171875, 1.304931640625, 1.4586181640625, 1.6123046875, 1.7659912109375, 1.919677734375, 2.0733642578125, 2.22705078125, 2.3807373046875, 2.534423828125, 2.6881103515625, 2.841796875, 2.9954833984375, 3.149169921875, 3.3028564453125, 3.45654296875, 3.6102294921875, 3.763916015625, 3.9176025390625, 4.0712890625, 4.2249755859375, 4.378662109375, 4.5323486328125, 4.68603515625, 4.8397216796875, 4.993408203125, 5.1470947265625, 5.30078125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 12.0, 10.0, 9.0, 15.0, 22.0, 26.0, 32.0, 50.0, 61.0, 70.0, 63.0, 63.0, 76.0, 80.0, 81.0, 73.0, 55.0, 45.0, 37.0, 38.0, 25.0, 19.0, 17.0, 6.0, 6.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-26.240989685058594, -25.665014266967773, -25.08903694152832, -24.5130615234375, -23.93708610534668, -23.36111068725586, -22.785133361816406, -22.209157943725586, -21.633182525634766, -21.057207107543945, -20.481229782104492, -19.905254364013672, -19.32927894592285, -18.75330352783203, -18.177326202392578, -17.601350784301758, -17.025373458862305, -16.449398040771484, -15.873421669006348, -15.297445297241211, -14.72146987915039, -14.145493507385254, -13.569517135620117, -12.993541717529297, -12.41756534576416, -11.841588973999023, -11.265613555908203, -10.689637184143066, -10.11366081237793, -9.53768539428711, -8.961709022521973, -8.385732650756836, -7.809755325317383, -7.233779430389404, -6.657803535461426, -6.081827163696289, -5.5058512687683105, -4.929875373840332, -4.353899002075195, -3.777923107147217, -3.2019472122192383, -2.6259713172912598, -2.049995183944702, -1.474019169807434, -0.898043155670166, -0.3220672607421875, 0.2539088726043701, 0.8298850059509277, 1.4058609008789062, 1.9818369150161743, 2.5578129291534424, 3.1337890625, 3.7097649574279785, 4.285740852355957, 4.861717224121094, 5.437693119049072, 6.013669013977051, 6.589644908905029, 7.165620803833008, 7.7415971755981445, 8.317573547363281, 8.893548965454102, 9.469525337219238, 10.045501708984375, 10.621477127075195]}, "gradients/decoder.model.decoder.layers.4.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 6.0, 9.0, 9.0, 11.0, 8.0, 10.0, 9.0, 22.0, 23.0, 23.0, 26.0, 26.0, 29.0, 28.0, 34.0, 39.0, 34.0, 50.0, 50.0, 41.0, 57.0, 33.0, 41.0, 41.0, 40.0, 44.0, 38.0, 33.0, 21.0, 24.0, 31.0, 16.0, 10.0, 15.0, 19.0, 14.0, 7.0, 8.0, 6.0, 4.0, 8.0, 5.0, 4.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.958385467529297, -13.52048397064209, -13.082582473754883, -12.644680976867676, -12.206779479980469, -11.768877983093262, -11.330976486206055, -10.893074035644531, -10.45517349243164, -10.017271995544434, -9.579370498657227, -9.14146900177002, -8.703567504882812, -8.265666007995605, -7.82776403427124, -7.389862537384033, -6.951960563659668, -6.514059066772461, -6.076157569885254, -5.638256072998047, -5.20035457611084, -4.762453079223633, -4.324551105499268, -3.8866496086120605, -3.4487481117248535, -3.0108466148376465, -2.5729451179504395, -2.1350433826446533, -1.6971418857574463, -1.2592403888702393, -0.8213386535644531, -0.3834371566772461, 0.05446434020996094, 0.49236589670181274, 0.9302674531936646, 1.3681690692901611, 1.8060705661773682, 2.243972063064575, 2.6818737983703613, 3.1197752952575684, 3.5576767921447754, 3.9955782890319824, 4.4334797859191895, 4.871381759643555, 5.309283256530762, 5.747184753417969, 6.185086250305176, 6.622987747192383, 7.06088924407959, 7.498790740966797, 7.936692237854004, 8.374593734741211, 8.812495231628418, 9.250396728515625, 9.688299179077148, 10.126199722290039, 10.564102172851562, 11.00200366973877, 11.439905166625977, 11.877806663513184, 12.31570816040039, 12.753609657287598, 13.191511154174805, 13.629413604736328, 14.067314147949219]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 8.0, 5.0, 16.0, 13.0, 26.0, 31.0, 46.0, 57.0, 78.0, 135.0, 235.0, 344.0, 694.0, 1349.0, 2713.0, 6278.0, 15339.0, 38332.0, 100372.0, 228850.0, 314305.0, 200052.0, 83663.0, 32548.0, 12675.0, 5314.0, 2383.0, 1212.0, 562.0, 331.0, 197.0, 123.0, 83.0, 39.0, 47.0, 29.0, 19.0, 19.0, 11.0, 4.0, 5.0, 9.0, 1.0, 4.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.24609375, -2.169708251953125, -2.09332275390625, -2.016937255859375, -1.9405517578125, -1.864166259765625, -1.78778076171875, -1.711395263671875, -1.635009765625, -1.558624267578125, -1.48223876953125, -1.405853271484375, -1.3294677734375, -1.253082275390625, -1.17669677734375, -1.100311279296875, -1.02392578125, -0.947540283203125, -0.87115478515625, -0.794769287109375, -0.7183837890625, -0.641998291015625, -0.56561279296875, -0.489227294921875, -0.412841796875, -0.336456298828125, -0.26007080078125, -0.183685302734375, -0.1072998046875, -0.030914306640625, 0.04547119140625, 0.121856689453125, 0.1982421875, 0.274627685546875, 0.35101318359375, 0.427398681640625, 0.5037841796875, 0.580169677734375, 0.65655517578125, 0.732940673828125, 0.809326171875, 0.885711669921875, 0.96209716796875, 1.038482666015625, 1.1148681640625, 1.191253662109375, 1.26763916015625, 1.344024658203125, 1.42041015625, 1.496795654296875, 1.57318115234375, 1.649566650390625, 1.7259521484375, 1.802337646484375, 1.87872314453125, 1.955108642578125, 2.031494140625, 2.107879638671875, 2.18426513671875, 2.260650634765625, 2.3370361328125, 2.413421630859375, 2.48980712890625, 2.566192626953125, 2.642578125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 7.0, 8.0, 15.0, 14.0, 10.0, 7.0, 27.0, 27.0, 28.0, 21.0, 23.0, 38.0, 26.0, 45.0, 40.0, 45.0, 39.0, 57.0, 51.0, 41.0, 45.0, 49.0, 43.0, 31.0, 23.0, 32.0, 31.0, 32.0, 13.0, 26.0, 22.0, 12.0, 9.0, 11.0, 13.0, 9.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.765625, -9.4466552734375, -9.127685546875, -8.8087158203125, -8.48974609375, -8.1707763671875, -7.851806640625, -7.5328369140625, -7.2138671875, -6.8948974609375, -6.575927734375, -6.2569580078125, -5.93798828125, -5.6190185546875, -5.300048828125, -4.9810791015625, -4.662109375, -4.3431396484375, -4.024169921875, -3.7052001953125, -3.38623046875, -3.0672607421875, -2.748291015625, -2.4293212890625, -2.1103515625, -1.7913818359375, -1.472412109375, -1.1534423828125, -0.83447265625, -0.5155029296875, -0.196533203125, 0.1224365234375, 0.44140625, 0.7603759765625, 1.079345703125, 1.3983154296875, 1.71728515625, 2.0362548828125, 2.355224609375, 2.6741943359375, 2.9931640625, 3.3121337890625, 3.631103515625, 3.9500732421875, 4.26904296875, 4.5880126953125, 4.906982421875, 5.2259521484375, 5.544921875, 5.8638916015625, 6.182861328125, 6.5018310546875, 6.82080078125, 7.1397705078125, 7.458740234375, 7.7777099609375, 8.0966796875, 8.4156494140625, 8.734619140625, 9.0535888671875, 9.37255859375, 9.6915283203125, 10.010498046875, 10.3294677734375, 10.6484375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 9.0, 10.0, 21.0, 20.0, 25.0, 55.0, 77.0, 115.0, 191.0, 289.0, 433.0, 752.0, 1369.0, 2178.0, 3953.0, 7067.0, 12445.0, 22347.0, 40178.0, 71066.0, 117516.0, 170072.0, 191945.0, 158525.0, 105685.0, 62611.0, 35132.0, 19486.0, 10774.0, 6000.0, 3434.0, 1925.0, 1142.0, 649.0, 377.0, 244.0, 155.0, 108.0, 63.0, 31.0, 25.0, 23.0, 11.0, 14.0, 5.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-1.1982421875, -1.157470703125, -1.11669921875, -1.075927734375, -1.03515625, -0.994384765625, -0.95361328125, -0.912841796875, -0.8720703125, -0.831298828125, -0.79052734375, -0.749755859375, -0.708984375, -0.668212890625, -0.62744140625, -0.586669921875, -0.5458984375, -0.505126953125, -0.46435546875, -0.423583984375, -0.3828125, -0.342041015625, -0.30126953125, -0.260498046875, -0.2197265625, -0.178955078125, -0.13818359375, -0.097412109375, -0.056640625, -0.015869140625, 0.02490234375, 0.065673828125, 0.1064453125, 0.147216796875, 0.18798828125, 0.228759765625, 0.26953125, 0.310302734375, 0.35107421875, 0.391845703125, 0.4326171875, 0.473388671875, 0.51416015625, 0.554931640625, 0.595703125, 0.636474609375, 0.67724609375, 0.718017578125, 0.7587890625, 0.799560546875, 0.84033203125, 0.881103515625, 0.921875, 0.962646484375, 1.00341796875, 1.044189453125, 1.0849609375, 1.125732421875, 1.16650390625, 1.207275390625, 1.248046875, 1.288818359375, 1.32958984375, 1.370361328125, 1.4111328125]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 4.0, 5.0, 8.0, 7.0, 9.0, 14.0, 8.0, 8.0, 13.0, 9.0, 23.0, 27.0, 17.0, 31.0, 36.0, 37.0, 27.0, 35.0, 38.0, 38.0, 41.0, 46.0, 46.0, 41.0, 43.0, 43.0, 44.0, 47.0, 40.0, 32.0, 24.0, 15.0, 19.0, 30.0, 21.0, 14.0, 14.0, 12.0, 8.0, 5.0, 6.0, 1.0, 3.0, 1.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.140625, -19.500244140625, -18.85986328125, -18.219482421875, -17.5791015625, -16.938720703125, -16.29833984375, -15.657958984375, -15.017578125, -14.377197265625, -13.73681640625, -13.096435546875, -12.4560546875, -11.815673828125, -11.17529296875, -10.534912109375, -9.89453125, -9.254150390625, -8.61376953125, -7.973388671875, -7.3330078125, -6.692626953125, -6.05224609375, -5.411865234375, -4.771484375, -4.131103515625, -3.49072265625, -2.850341796875, -2.2099609375, -1.569580078125, -0.92919921875, -0.288818359375, 0.3515625, 0.991943359375, 1.63232421875, 2.272705078125, 2.9130859375, 3.553466796875, 4.19384765625, 4.834228515625, 5.474609375, 6.114990234375, 6.75537109375, 7.395751953125, 8.0361328125, 8.676513671875, 9.31689453125, 9.957275390625, 10.59765625, 11.238037109375, 11.87841796875, 12.518798828125, 13.1591796875, 13.799560546875, 14.43994140625, 15.080322265625, 15.720703125, 16.361083984375, 17.00146484375, 17.641845703125, 18.2822265625, 18.922607421875, 19.56298828125, 20.203369140625, 20.84375]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 4.0, 5.0, 8.0, 11.0, 11.0, 14.0, 16.0, 31.0, 54.0, 79.0, 111.0, 195.0, 376.0, 570.0, 1357.0, 2846.0, 7313.0, 25506.0, 131027.0, 521962.0, 285560.0, 51505.0, 12104.0, 4081.0, 1810.0, 881.0, 459.0, 252.0, 140.0, 91.0, 54.0, 34.0, 34.0, 20.0, 12.0, 8.0, 4.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3837890625, -0.37042999267578125, -0.3570709228515625, -0.34371185302734375, -0.330352783203125, -0.31699371337890625, -0.3036346435546875, -0.29027557373046875, -0.27691650390625, -0.26355743408203125, -0.2501983642578125, -0.23683929443359375, -0.223480224609375, -0.21012115478515625, -0.1967620849609375, -0.18340301513671875, -0.1700439453125, -0.15668487548828125, -0.1433258056640625, -0.12996673583984375, -0.116607666015625, -0.10324859619140625, -0.0898895263671875, -0.07653045654296875, -0.06317138671875, -0.04981231689453125, -0.0364532470703125, -0.02309417724609375, -0.009735107421875, 0.00362396240234375, 0.0169830322265625, 0.03034210205078125, 0.043701171875, 0.05706024169921875, 0.0704193115234375, 0.08377838134765625, 0.097137451171875, 0.11049652099609375, 0.1238555908203125, 0.13721466064453125, 0.15057373046875, 0.16393280029296875, 0.1772918701171875, 0.19065093994140625, 0.204010009765625, 0.21736907958984375, 0.2307281494140625, 0.24408721923828125, 0.2574462890625, 0.27080535888671875, 0.2841644287109375, 0.29752349853515625, 0.310882568359375, 0.32424163818359375, 0.3376007080078125, 0.35095977783203125, 0.36431884765625, 0.37767791748046875, 0.3910369873046875, 0.40439605712890625, 0.417755126953125, 0.43111419677734375, 0.4444732666015625, 0.45783233642578125, 0.47119140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 5.0, 4.0, 1.0, 7.0, 7.0, 15.0, 31.0, 28.0, 38.0, 65.0, 85.0, 80.0, 105.0, 98.0, 86.0, 82.0, 77.0, 41.0, 41.0, 42.0, 31.0, 12.0, 10.0, 8.0, 2.0, 3.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002865791320800781, -0.00027925893664360046, -0.0002719387412071228, -0.00026461854577064514, -0.0002572983503341675, -0.0002499781548976898, -0.00024265795946121216, -0.0002353377640247345, -0.00022801756858825684, -0.00022069737315177917, -0.00021337717771530151, -0.00020605698227882385, -0.0001987367868423462, -0.00019141659140586853, -0.00018409639596939087, -0.0001767762005329132, -0.00016945600509643555, -0.00016213580965995789, -0.00015481561422348022, -0.00014749541878700256, -0.0001401752233505249, -0.00013285502791404724, -0.00012553483247756958, -0.00011821463704109192, -0.00011089444160461426, -0.0001035742461681366, -9.625405073165894e-05, -8.893385529518127e-05, -8.161365985870361e-05, -7.429346442222595e-05, -6.697326898574829e-05, -5.965307354927063e-05, -5.233287811279297e-05, -4.501268267631531e-05, -3.7692487239837646e-05, -3.0372291803359985e-05, -2.3052096366882324e-05, -1.5731900930404663e-05, -8.411705493927002e-06, -1.0915100574493408e-06, 6.22868537902832e-06, 1.3548880815505981e-05, 2.0869076251983643e-05, 2.8189271688461304e-05, 3.5509467124938965e-05, 4.2829662561416626e-05, 5.014985799789429e-05, 5.747005343437195e-05, 6.479024887084961e-05, 7.211044430732727e-05, 7.943063974380493e-05, 8.675083518028259e-05, 9.407103061676025e-05, 0.00010139122605323792, 0.00010871142148971558, 0.00011603161692619324, 0.0001233518123626709, 0.00013067200779914856, 0.00013799220323562622, 0.00014531239867210388, 0.00015263259410858154, 0.0001599527895450592, 0.00016727298498153687, 0.00017459318041801453, 0.0001819133758544922]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 6.0, 8.0, 9.0, 17.0, 42.0, 75.0, 135.0, 352.0, 1039.0, 4864.0, 49478.0, 675808.0, 295754.0, 17510.0, 2383.0, 578.0, 259.0, 103.0, 63.0, 27.0, 12.0, 10.0, 10.0, 4.0, 3.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6484375, -0.626678466796875, -0.60491943359375, -0.583160400390625, -0.5614013671875, -0.539642333984375, -0.51788330078125, -0.496124267578125, -0.474365234375, -0.452606201171875, -0.43084716796875, -0.409088134765625, -0.3873291015625, -0.365570068359375, -0.34381103515625, -0.322052001953125, -0.30029296875, -0.278533935546875, -0.25677490234375, -0.235015869140625, -0.2132568359375, -0.191497802734375, -0.16973876953125, -0.147979736328125, -0.126220703125, -0.104461669921875, -0.08270263671875, -0.060943603515625, -0.0391845703125, -0.017425537109375, 0.00433349609375, 0.026092529296875, 0.0478515625, 0.069610595703125, 0.09136962890625, 0.113128662109375, 0.1348876953125, 0.156646728515625, 0.17840576171875, 0.200164794921875, 0.221923828125, 0.243682861328125, 0.26544189453125, 0.287200927734375, 0.3089599609375, 0.330718994140625, 0.35247802734375, 0.374237060546875, 0.39599609375, 0.417755126953125, 0.43951416015625, 0.461273193359375, 0.4830322265625, 0.504791259765625, 0.52655029296875, 0.548309326171875, 0.570068359375, 0.591827392578125, 0.61358642578125, 0.635345458984375, 0.6571044921875, 0.678863525390625, 0.70062255859375, 0.722381591796875, 0.744140625]}, "gradients/decoder.model.decoder.layers.4.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 6.0, 5.0, 6.0, 8.0, 13.0, 16.0, 15.0, 26.0, 44.0, 58.0, 88.0, 84.0, 104.0, 109.0, 116.0, 77.0, 81.0, 39.0, 23.0, 23.0, 10.0, 11.0, 7.0, 10.0, 10.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10797119140625, -0.10327816009521484, -0.09858512878417969, -0.09389209747314453, -0.08919906616210938, -0.08450603485107422, -0.07981300354003906, -0.0751199722290039, -0.07042694091796875, -0.0657339096069336, -0.06104087829589844, -0.05634784698486328, -0.051654815673828125, -0.04696178436279297, -0.04226875305175781, -0.037575721740722656, -0.0328826904296875, -0.028189659118652344, -0.023496627807617188, -0.01880359649658203, -0.014110565185546875, -0.009417533874511719, -0.0047245025634765625, -3.147125244140625e-05, 0.00466156005859375, 0.009354591369628906, 0.014047622680664062, 0.01874065399169922, 0.023433685302734375, 0.02812671661376953, 0.03281974792480469, 0.037512779235839844, 0.042205810546875, 0.046898841857910156, 0.05159187316894531, 0.05628490447998047, 0.060977935791015625, 0.06567096710205078, 0.07036399841308594, 0.0750570297241211, 0.07975006103515625, 0.0844430923461914, 0.08913612365722656, 0.09382915496826172, 0.09852218627929688, 0.10321521759033203, 0.10790824890136719, 0.11260128021240234, 0.1172943115234375, 0.12198734283447266, 0.1266803741455078, 0.13137340545654297, 0.13606643676757812, 0.14075946807861328, 0.14545249938964844, 0.1501455307006836, 0.15483856201171875, 0.1595315933227539, 0.16422462463378906, 0.16891765594482422, 0.17361068725585938, 0.17830371856689453, 0.1829967498779297, 0.18768978118896484, 0.1923828125]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 10.0, 20.0, 40.0, 79.0, 144.0, 173.0, 191.0, 159.0, 101.0, 53.0, 25.0, 6.0, 4.0, 2.0], "bins": [-49.311859130859375, -48.43227005004883, -47.55268096923828, -46.673095703125, -45.79350662231445, -44.913917541503906, -44.03432846069336, -43.15473937988281, -42.275150299072266, -41.39556121826172, -40.51597213745117, -39.636383056640625, -38.756797790527344, -37.8772087097168, -36.99761962890625, -36.1180305480957, -35.238441467285156, -34.35885238647461, -33.47926330566406, -32.59967803955078, -31.7200870513916, -30.840499877929688, -29.96091079711914, -29.081321716308594, -28.201736450195312, -27.322147369384766, -26.44256019592285, -25.562971115112305, -24.683382034301758, -23.803794860839844, -22.924205780029297, -22.04461669921875, -21.165027618408203, -20.285438537597656, -19.405851364135742, -18.526262283325195, -17.64667320251465, -16.767086029052734, -15.887496948242188, -15.00790786743164, -14.128320693969727, -13.248732566833496, -12.36914348602295, -11.489555358886719, -10.609966278076172, -9.730378150939941, -8.850790023803711, -7.971201419830322, -7.091612815856934, -6.212024211883545, -5.332435607910156, -4.452847480773926, -3.573258876800537, -2.6936702728271484, -1.814082145690918, -0.9344935417175293, -0.054904937744140625, 0.8246835470199585, 1.7042720317840576, 2.583860397338867, 3.463449001312256, 4.3430376052856445, 5.222625732421875, 6.102214336395264, 6.981802940368652]}, "gradients/decoder.model.decoder.layers.4.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 9.0, 14.0, 5.0, 15.0, 10.0, 23.0, 23.0, 22.0, 26.0, 35.0, 26.0, 35.0, 47.0, 38.0, 43.0, 52.0, 56.0, 46.0, 42.0, 46.0, 45.0, 43.0, 38.0, 39.0, 36.0, 27.0, 28.0, 16.0, 16.0, 17.0, 16.0, 13.0, 11.0, 9.0, 7.0, 4.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-10.501741409301758, -10.179980278015137, -9.8582181930542, -9.536457061767578, -9.214695930480957, -8.892934799194336, -8.571172714233398, -8.249411582946777, -7.927650451660156, -7.605888843536377, -7.284127712249756, -6.962366104125977, -6.6406049728393555, -6.318843364715576, -5.997081756591797, -5.675320625305176, -5.3535590171813965, -5.031797409057617, -4.710036277770996, -4.388274669647217, -4.066513538360596, -3.7447519302368164, -3.422990560531616, -3.101229190826416, -2.779467821121216, -2.4577064514160156, -2.1359450817108154, -1.8141835927963257, -1.4924222230911255, -1.1706608533859253, -0.8488993644714355, -0.5271379947662354, -0.20537662506103516, 0.11638477444648743, 0.43814617395401, 0.759907603263855, 1.0816689729690552, 1.4034303426742554, 1.7251918315887451, 2.0469532012939453, 2.3687145709991455, 2.6904759407043457, 3.012237310409546, 3.333998680114746, 3.6557602882385254, 3.9775214195251465, 4.299283027648926, 4.621044158935547, 4.942805767059326, 5.2645673751831055, 5.586328506469727, 5.908090114593506, 6.229851245880127, 6.551612854003906, 6.873373985290527, 7.195135593414307, 7.516897201538086, 7.838658809661865, 8.160420417785645, 8.482181549072266, 8.803942680358887, 9.125703811645508, 9.447465896606445, 9.769227027893066, 10.090988159179688]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 8.0, 4.0, 10.0, 12.0, 15.0, 32.0, 55.0, 69.0, 125.0, 223.0, 463.0, 894.0, 1959.0, 4569.0, 11797.0, 34316.0, 111711.0, 339443.0, 360587.0, 123081.0, 37459.0, 12718.0, 4836.0, 2070.0, 999.0, 501.0, 234.0, 129.0, 84.0, 40.0, 24.0, 26.0, 18.0, 4.0, 7.0, 0.0, 7.0, 3.0, 2.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-11.1875, -10.8770751953125, -10.566650390625, -10.2562255859375, -9.94580078125, -9.6353759765625, -9.324951171875, -9.0145263671875, -8.7041015625, -8.3936767578125, -8.083251953125, -7.7728271484375, -7.46240234375, -7.1519775390625, -6.841552734375, -6.5311279296875, -6.220703125, -5.9102783203125, -5.599853515625, -5.2894287109375, -4.97900390625, -4.6685791015625, -4.358154296875, -4.0477294921875, -3.7373046875, -3.4268798828125, -3.116455078125, -2.8060302734375, -2.49560546875, -2.1851806640625, -1.874755859375, -1.5643310546875, -1.25390625, -0.9434814453125, -0.633056640625, -0.3226318359375, -0.01220703125, 0.2982177734375, 0.608642578125, 0.9190673828125, 1.2294921875, 1.5399169921875, 1.850341796875, 2.1607666015625, 2.47119140625, 2.7816162109375, 3.092041015625, 3.4024658203125, 3.712890625, 4.0233154296875, 4.333740234375, 4.6441650390625, 4.95458984375, 5.2650146484375, 5.575439453125, 5.8858642578125, 6.1962890625, 6.5067138671875, 6.817138671875, 7.1275634765625, 7.43798828125, 7.7484130859375, 8.058837890625, 8.3692626953125, 8.6796875]}, "gradients/decoder.model.decoder.layers.4.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 4.0, 10.0, 10.0, 8.0, 8.0, 10.0, 22.0, 13.0, 17.0, 22.0, 25.0, 29.0, 32.0, 22.0, 24.0, 36.0, 41.0, 30.0, 39.0, 51.0, 48.0, 40.0, 43.0, 41.0, 39.0, 45.0, 30.0, 37.0, 18.0, 19.0, 30.0, 18.0, 15.0, 20.0, 14.0, 16.0, 13.0, 17.0, 7.0, 9.0, 1.0, 2.0, 10.0, 1.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-16.03125, -15.513427734375, -14.99560546875, -14.477783203125, -13.9599609375, -13.442138671875, -12.92431640625, -12.406494140625, -11.888671875, -11.370849609375, -10.85302734375, -10.335205078125, -9.8173828125, -9.299560546875, -8.78173828125, -8.263916015625, -7.74609375, -7.228271484375, -6.71044921875, -6.192626953125, -5.6748046875, -5.156982421875, -4.63916015625, -4.121337890625, -3.603515625, -3.085693359375, -2.56787109375, -2.050048828125, -1.5322265625, -1.014404296875, -0.49658203125, 0.021240234375, 0.5390625, 1.056884765625, 1.57470703125, 2.092529296875, 2.6103515625, 3.128173828125, 3.64599609375, 4.163818359375, 4.681640625, 5.199462890625, 5.71728515625, 6.235107421875, 6.7529296875, 7.270751953125, 7.78857421875, 8.306396484375, 8.82421875, 9.342041015625, 9.85986328125, 10.377685546875, 10.8955078125, 11.413330078125, 11.93115234375, 12.448974609375, 12.966796875, 13.484619140625, 14.00244140625, 14.520263671875, 15.0380859375, 15.555908203125, 16.07373046875, 16.591552734375, 17.109375]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 7.0, 3.0, 13.0, 13.0, 12.0, 18.0, 32.0, 33.0, 53.0, 55.0, 86.0, 93.0, 159.0, 200.0, 326.0, 750.0, 2979.0, 37988.0, 697257.0, 292380.0, 13019.0, 1573.0, 527.0, 257.0, 203.0, 130.0, 85.0, 70.0, 44.0, 34.0, 27.0, 27.0, 24.0, 21.0, 14.0, 9.0, 7.0, 7.0, 4.0, 3.0, 3.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.265625, -21.518798828125, -20.77197265625, -20.025146484375, -19.2783203125, -18.531494140625, -17.78466796875, -17.037841796875, -16.291015625, -15.544189453125, -14.79736328125, -14.050537109375, -13.3037109375, -12.556884765625, -11.81005859375, -11.063232421875, -10.31640625, -9.569580078125, -8.82275390625, -8.075927734375, -7.3291015625, -6.582275390625, -5.83544921875, -5.088623046875, -4.341796875, -3.594970703125, -2.84814453125, -2.101318359375, -1.3544921875, -0.607666015625, 0.13916015625, 0.885986328125, 1.6328125, 2.379638671875, 3.12646484375, 3.873291015625, 4.6201171875, 5.366943359375, 6.11376953125, 6.860595703125, 7.607421875, 8.354248046875, 9.10107421875, 9.847900390625, 10.5947265625, 11.341552734375, 12.08837890625, 12.835205078125, 13.58203125, 14.328857421875, 15.07568359375, 15.822509765625, 16.5693359375, 17.316162109375, 18.06298828125, 18.809814453125, 19.556640625, 20.303466796875, 21.05029296875, 21.797119140625, 22.5439453125, 23.290771484375, 24.03759765625, 24.784423828125, 25.53125]}, "gradients/decoder.model.decoder.layers.4.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 6.0, 6.0, 4.0, 8.0, 5.0, 7.0, 8.0, 14.0, 22.0, 21.0, 20.0, 25.0, 21.0, 32.0, 32.0, 36.0, 45.0, 41.0, 34.0, 52.0, 39.0, 51.0, 49.0, 47.0, 36.0, 48.0, 40.0, 33.0, 42.0, 28.0, 30.0, 22.0, 16.0, 18.0, 14.0, 11.0, 10.0, 9.0, 2.0, 4.0, 5.0, 4.0, 2.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.5625, -19.82080078125, -19.0791015625, -18.33740234375, -17.595703125, -16.85400390625, -16.1123046875, -15.37060546875, -14.62890625, -13.88720703125, -13.1455078125, -12.40380859375, -11.662109375, -10.92041015625, -10.1787109375, -9.43701171875, -8.6953125, -7.95361328125, -7.2119140625, -6.47021484375, -5.728515625, -4.98681640625, -4.2451171875, -3.50341796875, -2.76171875, -2.02001953125, -1.2783203125, -0.53662109375, 0.205078125, 0.94677734375, 1.6884765625, 2.43017578125, 3.171875, 3.91357421875, 4.6552734375, 5.39697265625, 6.138671875, 6.88037109375, 7.6220703125, 8.36376953125, 9.10546875, 9.84716796875, 10.5888671875, 11.33056640625, 12.072265625, 12.81396484375, 13.5556640625, 14.29736328125, 15.0390625, 15.78076171875, 16.5224609375, 17.26416015625, 18.005859375, 18.74755859375, 19.4892578125, 20.23095703125, 20.97265625, 21.71435546875, 22.4560546875, 23.19775390625, 23.939453125, 24.68115234375, 25.4228515625, 26.16455078125, 26.90625]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 0.0, 10.0, 4.0, 21.0, 61.0, 221.0, 831.0, 4623.0, 468357.0, 568333.0, 4924.0, 848.0, 198.0, 57.0, 36.0, 15.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-23.765625, -23.105712890625, -22.44580078125, -21.785888671875, -21.1259765625, -20.466064453125, -19.80615234375, -19.146240234375, -18.486328125, -17.826416015625, -17.16650390625, -16.506591796875, -15.8466796875, -15.186767578125, -14.52685546875, -13.866943359375, -13.20703125, -12.547119140625, -11.88720703125, -11.227294921875, -10.5673828125, -9.907470703125, -9.24755859375, -8.587646484375, -7.927734375, -7.267822265625, -6.60791015625, -5.947998046875, -5.2880859375, -4.628173828125, -3.96826171875, -3.308349609375, -2.6484375, -1.988525390625, -1.32861328125, -0.668701171875, -0.0087890625, 0.651123046875, 1.31103515625, 1.970947265625, 2.630859375, 3.290771484375, 3.95068359375, 4.610595703125, 5.2705078125, 5.930419921875, 6.59033203125, 7.250244140625, 7.91015625, 8.570068359375, 9.22998046875, 9.889892578125, 10.5498046875, 11.209716796875, 11.86962890625, 12.529541015625, 13.189453125, 13.849365234375, 14.50927734375, 15.169189453125, 15.8291015625, 16.489013671875, 17.14892578125, 17.808837890625, 18.46875]}, "gradients/decoder.model.decoder.layers.4.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 30.0, 41.0, 77.0, 133.0, 205.0, 187.0, 125.0, 83.0, 35.0, 32.0, 17.0, 6.0, 7.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015211105346679688, -0.0014666169881820679, -0.001412123441696167, -0.0013576298952102661, -0.0013031363487243652, -0.0012486428022384644, -0.0011941492557525635, -0.0011396557092666626, -0.0010851621627807617, -0.0010306686162948608, -0.00097617506980896, -0.0009216815233230591, -0.0008671879768371582, -0.0008126944303512573, -0.0007582008838653564, -0.0007037073373794556, -0.0006492137908935547, -0.0005947202444076538, -0.0005402266979217529, -0.00048573315143585205, -0.00043123960494995117, -0.0003767460584640503, -0.0003222525119781494, -0.00026775896549224854, -0.00021326541900634766, -0.00015877187252044678, -0.0001042783260345459, -4.978477954864502e-05, 4.708766937255859e-06, 5.920231342315674e-05, 0.00011369585990905762, 0.0001681894063949585, 0.00022268295288085938, 0.00027717649936676025, 0.00033167004585266113, 0.000386163592338562, 0.0004406571388244629, 0.0004951506853103638, 0.0005496442317962646, 0.0006041377782821655, 0.0006586313247680664, 0.0007131248712539673, 0.0007676184177398682, 0.000822111964225769, 0.0008766055107116699, 0.0009310990571975708, 0.0009855926036834717, 0.0010400861501693726, 0.0010945796966552734, 0.0011490732431411743, 0.0012035667896270752, 0.001258060336112976, 0.001312553882598877, 0.0013670474290847778, 0.0014215409755706787, 0.0014760345220565796, 0.0015305280685424805, 0.0015850216150283813, 0.0016395151615142822, 0.001694008708000183, 0.001748502254486084, 0.0018029958009719849, 0.0018574893474578857, 0.0019119828939437866, 0.0019664764404296875]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 7.0, 16.0, 20.0, 63.0, 125.0, 342.0, 943.0, 4846.0, 350227.0, 683944.0, 6256.0, 1114.0, 360.0, 165.0, 60.0, 28.0, 12.0, 11.0, 10.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.3125, -20.721435546875, -20.13037109375, -19.539306640625, -18.9482421875, -18.357177734375, -17.76611328125, -17.175048828125, -16.583984375, -15.992919921875, -15.40185546875, -14.810791015625, -14.2197265625, -13.628662109375, -13.03759765625, -12.446533203125, -11.85546875, -11.264404296875, -10.67333984375, -10.082275390625, -9.4912109375, -8.900146484375, -8.30908203125, -7.718017578125, -7.126953125, -6.535888671875, -5.94482421875, -5.353759765625, -4.7626953125, -4.171630859375, -3.58056640625, -2.989501953125, -2.3984375, -1.807373046875, -1.21630859375, -0.625244140625, -0.0341796875, 0.556884765625, 1.14794921875, 1.739013671875, 2.330078125, 2.921142578125, 3.51220703125, 4.103271484375, 4.6943359375, 5.285400390625, 5.87646484375, 6.467529296875, 7.05859375, 7.649658203125, 8.24072265625, 8.831787109375, 9.4228515625, 10.013916015625, 10.60498046875, 11.196044921875, 11.787109375, 12.378173828125, 12.96923828125, 13.560302734375, 14.1513671875, 14.742431640625, 15.33349609375, 15.924560546875, 16.515625]}, "gradients/decoder.model.decoder.layers.4.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 6.0, 11.0, 8.0, 20.0, 28.0, 50.0, 66.0, 74.0, 127.0, 154.0, 134.0, 111.0, 71.0, 44.0, 25.0, 26.0, 27.0, 11.0, 10.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.12890625, -4.040435791015625, -3.95196533203125, -3.863494873046875, -3.7750244140625, -3.686553955078125, -3.59808349609375, -3.509613037109375, -3.421142578125, -3.332672119140625, -3.24420166015625, -3.155731201171875, -3.0672607421875, -2.978790283203125, -2.89031982421875, -2.801849365234375, -2.71337890625, -2.624908447265625, -2.53643798828125, -2.447967529296875, -2.3594970703125, -2.271026611328125, -2.18255615234375, -2.094085693359375, -2.005615234375, -1.917144775390625, -1.82867431640625, -1.740203857421875, -1.6517333984375, -1.563262939453125, -1.47479248046875, -1.386322021484375, -1.2978515625, -1.209381103515625, -1.12091064453125, -1.032440185546875, -0.9439697265625, -0.855499267578125, -0.76702880859375, -0.678558349609375, -0.590087890625, -0.501617431640625, -0.41314697265625, -0.324676513671875, -0.2362060546875, -0.147735595703125, -0.05926513671875, 0.029205322265625, 0.11767578125, 0.206146240234375, 0.29461669921875, 0.383087158203125, 0.4715576171875, 0.560028076171875, 0.64849853515625, 0.736968994140625, 0.825439453125, 0.913909912109375, 1.00238037109375, 1.090850830078125, 1.1793212890625, 1.267791748046875, 1.35626220703125, 1.444732666015625, 1.533203125]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 5.0, 5.0, 16.0, 15.0, 31.0, 76.0, 106.0, 119.0, 141.0, 155.0, 121.0, 83.0, 53.0, 46.0, 21.0, 10.0, 5.0, 1.0, 2.0], "bins": [-69.99202728271484, -68.69107818603516, -67.39013671875, -66.08918762207031, -64.78823852539062, -63.4872932434082, -62.186344146728516, -60.885398864746094, -59.584449768066406, -58.283504486083984, -56.9825553894043, -55.681610107421875, -54.38066101074219, -53.079715728759766, -51.77876663208008, -50.477821350097656, -49.17687225341797, -47.87592697143555, -46.57497787475586, -45.27403259277344, -43.97308349609375, -42.67213821411133, -41.37118911743164, -40.07024383544922, -38.7692985534668, -37.468353271484375, -36.16740417480469, -34.866458892822266, -33.56550979614258, -32.264564514160156, -30.96361541748047, -29.662670135498047, -28.361717224121094, -27.06077003479004, -25.759822845458984, -24.45887565612793, -23.157928466796875, -21.85698127746582, -20.556034088134766, -19.255088806152344, -17.95414161682129, -16.653194427490234, -15.35224723815918, -14.051300048828125, -12.75035285949707, -11.449405670166016, -10.148459434509277, -8.847512245178223, -7.546565055847168, -6.245617866516113, -4.944670677185059, -3.643723964691162, -2.3427767753601074, -1.0418295860290527, 0.25911712646484375, 1.5600643157958984, 2.861011505126953, 4.161958694458008, 5.4629058837890625, 6.763852596282959, 8.064800262451172, 9.365747451782227, 10.666693687438965, 11.96764087677002, 13.268588066101074]}, "gradients/decoder.model.decoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 7.0, 6.0, 14.0, 8.0, 13.0, 16.0, 14.0, 18.0, 31.0, 26.0, 35.0, 26.0, 39.0, 27.0, 34.0, 32.0, 41.0, 41.0, 43.0, 37.0, 41.0, 51.0, 44.0, 31.0, 30.0, 35.0, 37.0, 32.0, 18.0, 18.0, 23.0, 19.0, 16.0, 14.0, 12.0, 7.0, 10.0, 18.0, 6.0, 4.0, 2.0, 5.0, 6.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.292678833007812, -29.193513870239258, -28.094350814819336, -26.99518585205078, -25.89602279663086, -24.796857833862305, -23.69769287109375, -22.598529815673828, -21.499364852905273, -20.40019989013672, -19.301036834716797, -18.201871871948242, -17.102706909179688, -16.003543853759766, -14.904378890991211, -13.805214881896973, -12.706050872802734, -11.606886863708496, -10.507722854614258, -9.408557891845703, -8.309393882751465, -7.210229873657227, -6.11106538772583, -5.011900901794434, -3.9127368927001953, -2.813572645187378, -1.7144083976745605, -0.6152441501617432, 0.4839200973510742, 1.5830841064453125, 2.682248592376709, 3.7814130783081055, 4.880577087402344, 5.979741096496582, 7.0789055824279785, 8.178070068359375, 9.277234077453613, 10.376398086547852, 11.475563049316406, 12.574727058410645, 13.673891067504883, 14.773055076599121, 15.87221908569336, 16.971384048461914, 18.07054901123047, 19.16971206665039, 20.268877029418945, 21.3680419921875, 22.467205047607422, 23.566370010375977, 24.6655330657959, 25.764698028564453, 26.863861083984375, 27.96302604675293, 29.062191009521484, 30.161354064941406, 31.26051902770996, 32.359683990478516, 33.45884704589844, 34.55801010131836, 35.65717697143555, 36.75634002685547, 37.85550308227539, 38.95466995239258, 40.0538330078125]}, "gradients/decoder.model.decoder.layers.3.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 6.0, 1.0, 11.0, 5.0, 16.0, 19.0, 31.0, 39.0, 57.0, 75.0, 83.0, 114.0, 168.0, 264.0, 388.0, 675.0, 1947.0, 8474.0, 67543.0, 879684.0, 2792088.0, 400611.0, 33293.0, 5412.0, 1470.0, 598.0, 343.0, 229.0, 173.0, 127.0, 90.0, 73.0, 48.0, 36.0, 22.0, 18.0, 13.0, 13.0, 12.0, 0.0, 1.0, 11.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-22.9375, -22.228515625, -21.51953125, -20.810546875, -20.1015625, -19.392578125, -18.68359375, -17.974609375, -17.265625, -16.556640625, -15.84765625, -15.138671875, -14.4296875, -13.720703125, -13.01171875, -12.302734375, -11.59375, -10.884765625, -10.17578125, -9.466796875, -8.7578125, -8.048828125, -7.33984375, -6.630859375, -5.921875, -5.212890625, -4.50390625, -3.794921875, -3.0859375, -2.376953125, -1.66796875, -0.958984375, -0.25, 0.458984375, 1.16796875, 1.876953125, 2.5859375, 3.294921875, 4.00390625, 4.712890625, 5.421875, 6.130859375, 6.83984375, 7.548828125, 8.2578125, 8.966796875, 9.67578125, 10.384765625, 11.09375, 11.802734375, 12.51171875, 13.220703125, 13.9296875, 14.638671875, 15.34765625, 16.056640625, 16.765625, 17.474609375, 18.18359375, 18.892578125, 19.6015625, 20.310546875, 21.01953125, 21.728515625, 22.4375]}, "gradients/decoder.model.decoder.layers.3.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 5.0, 7.0, 16.0, 6.0, 15.0, 21.0, 20.0, 25.0, 13.0, 45.0, 23.0, 37.0, 50.0, 46.0, 45.0, 51.0, 66.0, 56.0, 52.0, 53.0, 54.0, 31.0, 39.0, 25.0, 41.0, 26.0, 14.0, 14.0, 17.0, 17.0, 17.0, 14.0, 4.0, 9.0, 7.0, 4.0, 9.0, 3.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.2734375, -10.901123046875, -10.52880859375, -10.156494140625, -9.7841796875, -9.411865234375, -9.03955078125, -8.667236328125, -8.294921875, -7.922607421875, -7.55029296875, -7.177978515625, -6.8056640625, -6.433349609375, -6.06103515625, -5.688720703125, -5.31640625, -4.944091796875, -4.57177734375, -4.199462890625, -3.8271484375, -3.454833984375, -3.08251953125, -2.710205078125, -2.337890625, -1.965576171875, -1.59326171875, -1.220947265625, -0.8486328125, -0.476318359375, -0.10400390625, 0.268310546875, 0.640625, 1.012939453125, 1.38525390625, 1.757568359375, 2.1298828125, 2.502197265625, 2.87451171875, 3.246826171875, 3.619140625, 3.991455078125, 4.36376953125, 4.736083984375, 5.1083984375, 5.480712890625, 5.85302734375, 6.225341796875, 6.59765625, 6.969970703125, 7.34228515625, 7.714599609375, 8.0869140625, 8.459228515625, 8.83154296875, 9.203857421875, 9.576171875, 9.948486328125, 10.32080078125, 10.693115234375, 11.0654296875, 11.437744140625, 11.81005859375, 12.182373046875, 12.5546875]}, "gradients/decoder.model.decoder.layers.3.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 3.0, 13.0, 5.0, 16.0, 31.0, 41.0, 79.0, 106.0, 200.0, 367.0, 773.0, 1805.0, 6117.0, 42761.0, 1144533.0, 2873118.0, 108950.0, 10502.0, 2680.0, 1069.0, 496.0, 244.0, 144.0, 81.0, 56.0, 26.0, 19.0, 14.0, 12.0, 2.0, 2.0, 5.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.40625, -18.66455078125, -17.9228515625, -17.18115234375, -16.439453125, -15.69775390625, -14.9560546875, -14.21435546875, -13.47265625, -12.73095703125, -11.9892578125, -11.24755859375, -10.505859375, -9.76416015625, -9.0224609375, -8.28076171875, -7.5390625, -6.79736328125, -6.0556640625, -5.31396484375, -4.572265625, -3.83056640625, -3.0888671875, -2.34716796875, -1.60546875, -0.86376953125, -0.1220703125, 0.61962890625, 1.361328125, 2.10302734375, 2.8447265625, 3.58642578125, 4.328125, 5.06982421875, 5.8115234375, 6.55322265625, 7.294921875, 8.03662109375, 8.7783203125, 9.52001953125, 10.26171875, 11.00341796875, 11.7451171875, 12.48681640625, 13.228515625, 13.97021484375, 14.7119140625, 15.45361328125, 16.1953125, 16.93701171875, 17.6787109375, 18.42041015625, 19.162109375, 19.90380859375, 20.6455078125, 21.38720703125, 22.12890625, 22.87060546875, 23.6123046875, 24.35400390625, 25.095703125, 25.83740234375, 26.5791015625, 27.32080078125, 28.0625]}, "gradients/decoder.model.decoder.layers.3.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 9.0, 10.0, 17.0, 21.0, 19.0, 25.0, 43.0, 50.0, 108.0, 145.0, 193.0, 267.0, 363.0, 415.0, 524.0, 485.0, 397.0, 297.0, 193.0, 137.0, 101.0, 84.0, 50.0, 32.0, 26.0, 14.0, 15.0, 8.0, 6.0, 6.0, 5.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-6.53125, -6.370391845703125, -6.20953369140625, -6.048675537109375, -5.8878173828125, -5.726959228515625, -5.56610107421875, -5.405242919921875, -5.244384765625, -5.083526611328125, -4.92266845703125, -4.761810302734375, -4.6009521484375, -4.440093994140625, -4.27923583984375, -4.118377685546875, -3.95751953125, -3.796661376953125, -3.63580322265625, -3.474945068359375, -3.3140869140625, -3.153228759765625, -2.99237060546875, -2.831512451171875, -2.670654296875, -2.509796142578125, -2.34893798828125, -2.188079833984375, -2.0272216796875, -1.866363525390625, -1.70550537109375, -1.544647216796875, -1.3837890625, -1.222930908203125, -1.06207275390625, -0.901214599609375, -0.7403564453125, -0.579498291015625, -0.41864013671875, -0.257781982421875, -0.096923828125, 0.063934326171875, 0.22479248046875, 0.385650634765625, 0.5465087890625, 0.707366943359375, 0.86822509765625, 1.029083251953125, 1.18994140625, 1.350799560546875, 1.51165771484375, 1.672515869140625, 1.8333740234375, 1.994232177734375, 2.15509033203125, 2.315948486328125, 2.476806640625, 2.637664794921875, 2.79852294921875, 2.959381103515625, 3.1202392578125, 3.281097412109375, 3.44195556640625, 3.602813720703125, 3.763671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 8.0, 15.0, 16.0, 20.0, 31.0, 36.0, 40.0, 71.0, 59.0, 62.0, 76.0, 85.0, 80.0, 66.0, 58.0, 64.0, 53.0, 39.0, 28.0, 24.0, 25.0, 12.0, 7.0, 4.0, 6.0, 3.0, 3.0, 3.0, 5.0, 1.0, 4.0], "bins": [-23.248619079589844, -22.72801399230957, -22.207408905029297, -21.68680191040039, -21.166196823120117, -20.645591735839844, -20.12498664855957, -19.604381561279297, -19.08377456665039, -18.563169479370117, -18.042564392089844, -17.521957397460938, -17.001352310180664, -16.48074722290039, -15.960142135620117, -15.439536094665527, -14.918931007385254, -14.39832592010498, -13.87771987915039, -13.357114791870117, -12.836508750915527, -12.315903663635254, -11.795297622680664, -11.27469253540039, -10.754087448120117, -10.233482360839844, -9.712876319885254, -9.19227123260498, -8.67166519165039, -8.151060104370117, -7.6304545402526855, -7.109848976135254, -6.589242935180664, -6.068637371063232, -5.548031806945801, -5.027426719665527, -4.5068206787109375, -3.986215353012085, -3.4656100273132324, -2.945004463195801, -2.424398899078369, -1.9037933349609375, -1.3831878900527954, -0.8625824451446533, -0.3419768810272217, 0.17862868309020996, 0.6992340087890625, 1.2198395729064941, 1.7404451370239258, 2.2610507011413574, 2.781656265258789, 3.3022615909576416, 3.8228671550750732, 4.343472480773926, 4.864078044891357, 5.384683609008789, 5.905289173126221, 6.425894737243652, 6.946500301361084, 7.467105865478516, 7.987710952758789, 8.508316993713379, 9.028922080993652, 9.549528121948242, 10.070133209228516]}, "gradients/decoder.model.decoder.layers.3.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 7.0, 6.0, 4.0, 12.0, 13.0, 14.0, 16.0, 23.0, 22.0, 21.0, 31.0, 31.0, 33.0, 35.0, 31.0, 28.0, 53.0, 32.0, 40.0, 52.0, 38.0, 35.0, 52.0, 24.0, 32.0, 36.0, 25.0, 27.0, 24.0, 33.0, 21.0, 24.0, 15.0, 17.0, 13.0, 16.0, 12.0, 5.0, 9.0, 7.0, 6.0, 2.0, 6.0, 5.0, 3.0, 2.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.425792694091797, -11.05117416381836, -10.676554679870605, -10.301935195922852, -9.927316665649414, -9.552698135375977, -9.178078651428223, -8.803459167480469, -8.428840637207031, -8.054222106933594, -7.67960262298584, -7.304983615875244, -6.930364608764648, -6.555745601654053, -6.181126594543457, -5.806507587432861, -5.431888580322266, -5.05726957321167, -4.682650566101074, -4.3080315589904785, -3.933412551879883, -3.558793544769287, -3.1841745376586914, -2.8095555305480957, -2.4349365234375, -2.0603175163269043, -1.6856985092163086, -1.311079502105713, -0.9364604949951172, -0.5618414878845215, -0.18722248077392578, 0.18739652633666992, 0.5620145797729492, 0.9366335868835449, 1.3112525939941406, 1.6858716011047363, 2.060490608215332, 2.4351096153259277, 2.8097286224365234, 3.184347629547119, 3.558966636657715, 3.9335856437683105, 4.308204650878906, 4.682823657989502, 5.057442665100098, 5.432061672210693, 5.806680679321289, 6.181299686431885, 6.5559186935424805, 6.930537700653076, 7.305156707763672, 7.679775714874268, 8.054394721984863, 8.429014205932617, 8.803632736206055, 9.178251266479492, 9.552870750427246, 9.927490234375, 10.302108764648438, 10.676727294921875, 11.051346778869629, 11.425966262817383, 11.80058479309082, 12.175203323364258, 12.549822807312012]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 16.0, 13.0, 38.0, 53.0, 76.0, 123.0, 195.0, 315.0, 668.0, 1360.0, 3166.0, 8126.0, 23396.0, 77029.0, 250183.0, 403729.0, 193361.0, 57680.0, 17725.0, 6293.0, 2508.0, 1136.0, 596.0, 315.0, 163.0, 93.0, 57.0, 45.0, 30.0, 16.0, 12.0, 12.0, 7.0, 6.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.337890625, -2.25250244140625, -2.1671142578125, -2.08172607421875, -1.996337890625, -1.91094970703125, -1.8255615234375, -1.74017333984375, -1.65478515625, -1.56939697265625, -1.4840087890625, -1.39862060546875, -1.313232421875, -1.22784423828125, -1.1424560546875, -1.05706787109375, -0.9716796875, -0.88629150390625, -0.8009033203125, -0.71551513671875, -0.630126953125, -0.54473876953125, -0.4593505859375, -0.37396240234375, -0.28857421875, -0.20318603515625, -0.1177978515625, -0.03240966796875, 0.052978515625, 0.13836669921875, 0.2237548828125, 0.30914306640625, 0.39453125, 0.47991943359375, 0.5653076171875, 0.65069580078125, 0.736083984375, 0.82147216796875, 0.9068603515625, 0.99224853515625, 1.07763671875, 1.16302490234375, 1.2484130859375, 1.33380126953125, 1.419189453125, 1.50457763671875, 1.5899658203125, 1.67535400390625, 1.7607421875, 1.84613037109375, 1.9315185546875, 2.01690673828125, 2.102294921875, 2.18768310546875, 2.2730712890625, 2.35845947265625, 2.44384765625, 2.52923583984375, 2.6146240234375, 2.70001220703125, 2.785400390625, 2.87078857421875, 2.9561767578125, 3.04156494140625, 3.126953125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 7.0, 13.0, 11.0, 18.0, 20.0, 27.0, 33.0, 35.0, 40.0, 56.0, 38.0, 45.0, 39.0, 59.0, 51.0, 49.0, 53.0, 58.0, 35.0, 38.0, 38.0, 25.0, 32.0, 30.0, 30.0, 31.0, 17.0, 11.0, 7.0, 10.0, 7.0, 9.0, 5.0, 1.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3671875, -8.056640625, -7.74609375, -7.435546875, -7.125, -6.814453125, -6.50390625, -6.193359375, -5.8828125, -5.572265625, -5.26171875, -4.951171875, -4.640625, -4.330078125, -4.01953125, -3.708984375, -3.3984375, -3.087890625, -2.77734375, -2.466796875, -2.15625, -1.845703125, -1.53515625, -1.224609375, -0.9140625, -0.603515625, -0.29296875, 0.017578125, 0.328125, 0.638671875, 0.94921875, 1.259765625, 1.5703125, 1.880859375, 2.19140625, 2.501953125, 2.8125, 3.123046875, 3.43359375, 3.744140625, 4.0546875, 4.365234375, 4.67578125, 4.986328125, 5.296875, 5.607421875, 5.91796875, 6.228515625, 6.5390625, 6.849609375, 7.16015625, 7.470703125, 7.78125, 8.091796875, 8.40234375, 8.712890625, 9.0234375, 9.333984375, 9.64453125, 9.955078125, 10.265625, 10.576171875, 10.88671875, 11.197265625, 11.5078125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 8.0, 5.0, 7.0, 17.0, 24.0, 42.0, 47.0, 79.0, 124.0, 208.0, 360.0, 701.0, 1252.0, 2198.0, 4551.0, 9096.0, 19004.0, 39834.0, 83154.0, 158942.0, 238078.0, 222234.0, 136090.0, 68530.0, 32900.0, 15695.0, 7465.0, 3729.0, 1858.0, 989.0, 556.0, 304.0, 164.0, 140.0, 74.0, 32.0, 24.0, 17.0, 13.0, 6.0, 0.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.544921875, -1.503021240234375, -1.46112060546875, -1.419219970703125, -1.3773193359375, -1.335418701171875, -1.29351806640625, -1.251617431640625, -1.209716796875, -1.167816162109375, -1.12591552734375, -1.084014892578125, -1.0421142578125, -1.000213623046875, -0.95831298828125, -0.916412353515625, -0.87451171875, -0.832611083984375, -0.79071044921875, -0.748809814453125, -0.7069091796875, -0.665008544921875, -0.62310791015625, -0.581207275390625, -0.539306640625, -0.497406005859375, -0.45550537109375, -0.413604736328125, -0.3717041015625, -0.329803466796875, -0.28790283203125, -0.246002197265625, -0.2041015625, -0.162200927734375, -0.12030029296875, -0.078399658203125, -0.0364990234375, 0.005401611328125, 0.04730224609375, 0.089202880859375, 0.131103515625, 0.173004150390625, 0.21490478515625, 0.256805419921875, 0.2987060546875, 0.340606689453125, 0.38250732421875, 0.424407958984375, 0.46630859375, 0.508209228515625, 0.55010986328125, 0.592010498046875, 0.6339111328125, 0.675811767578125, 0.71771240234375, 0.759613037109375, 0.801513671875, 0.843414306640625, 0.88531494140625, 0.927215576171875, 0.9691162109375, 1.011016845703125, 1.05291748046875, 1.094818115234375, 1.13671875]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 6.0, 5.0, 13.0, 9.0, 12.0, 18.0, 21.0, 18.0, 26.0, 45.0, 42.0, 46.0, 40.0, 39.0, 52.0, 55.0, 60.0, 47.0, 47.0, 55.0, 48.0, 43.0, 49.0, 36.0, 25.0, 16.0, 20.0, 28.0, 20.0, 13.0, 9.0, 10.0, 6.0, 5.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-23.046875, -22.443603515625, -21.84033203125, -21.237060546875, -20.6337890625, -20.030517578125, -19.42724609375, -18.823974609375, -18.220703125, -17.617431640625, -17.01416015625, -16.410888671875, -15.8076171875, -15.204345703125, -14.60107421875, -13.997802734375, -13.39453125, -12.791259765625, -12.18798828125, -11.584716796875, -10.9814453125, -10.378173828125, -9.77490234375, -9.171630859375, -8.568359375, -7.965087890625, -7.36181640625, -6.758544921875, -6.1552734375, -5.552001953125, -4.94873046875, -4.345458984375, -3.7421875, -3.138916015625, -2.53564453125, -1.932373046875, -1.3291015625, -0.725830078125, -0.12255859375, 0.480712890625, 1.083984375, 1.687255859375, 2.29052734375, 2.893798828125, 3.4970703125, 4.100341796875, 4.70361328125, 5.306884765625, 5.91015625, 6.513427734375, 7.11669921875, 7.719970703125, 8.3232421875, 8.926513671875, 9.52978515625, 10.133056640625, 10.736328125, 11.339599609375, 11.94287109375, 12.546142578125, 13.1494140625, 13.752685546875, 14.35595703125, 14.959228515625, 15.5625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 14.0, 13.0, 8.0, 17.0, 26.0, 42.0, 63.0, 79.0, 98.0, 141.0, 226.0, 328.0, 492.0, 834.0, 1412.0, 2609.0, 5334.0, 11541.0, 27525.0, 71556.0, 182754.0, 334728.0, 241234.0, 100008.0, 37766.0, 15167.0, 6824.0, 3200.0, 1680.0, 983.0, 586.0, 356.0, 279.0, 193.0, 114.0, 91.0, 73.0, 47.0, 32.0, 30.0, 18.0, 11.0, 6.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0], "bins": [-0.2093505859375, -0.20348167419433594, -0.19761276245117188, -0.1917438507080078, -0.18587493896484375, -0.1800060272216797, -0.17413711547851562, -0.16826820373535156, -0.1623992919921875, -0.15653038024902344, -0.15066146850585938, -0.1447925567626953, -0.13892364501953125, -0.1330547332763672, -0.12718582153320312, -0.12131690979003906, -0.115447998046875, -0.10957908630371094, -0.10371017456054688, -0.09784126281738281, -0.09197235107421875, -0.08610343933105469, -0.08023452758789062, -0.07436561584472656, -0.0684967041015625, -0.06262779235839844, -0.056758880615234375, -0.05088996887207031, -0.04502105712890625, -0.03915214538574219, -0.033283233642578125, -0.027414321899414062, -0.02154541015625, -0.015676498413085938, -0.009807586669921875, -0.0039386749267578125, 0.00193023681640625, 0.0077991485595703125, 0.013668060302734375, 0.019536972045898438, 0.0254058837890625, 0.03127479553222656, 0.037143707275390625, 0.04301261901855469, 0.04888153076171875, 0.05475044250488281, 0.060619354248046875, 0.06648826599121094, 0.072357177734375, 0.07822608947753906, 0.08409500122070312, 0.08996391296386719, 0.09583282470703125, 0.10170173645019531, 0.10757064819335938, 0.11343955993652344, 0.1193084716796875, 0.12517738342285156, 0.13104629516601562, 0.1369152069091797, 0.14278411865234375, 0.1486530303955078, 0.15452194213867188, 0.16039085388183594, 0.166259765625]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 5.0, 5.0, 6.0, 18.0, 7.0, 21.0, 25.0, 27.0, 43.0, 50.0, 73.0, 78.0, 86.0, 105.0, 73.0, 73.0, 67.0, 51.0, 45.0, 30.0, 35.0, 17.0, 19.0, 12.0, 6.0, 6.0, 4.0, 9.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001710653305053711, -0.00016580335795879364, -0.0001605413854122162, -0.00015527941286563873, -0.00015001744031906128, -0.00014475546777248383, -0.00013949349522590637, -0.00013423152267932892, -0.00012896955013275146, -0.000123707577586174, -0.00011844560503959656, -0.0001131836324930191, -0.00010792165994644165, -0.0001026596873998642, -9.739771485328674e-05, -9.213574230670929e-05, -8.687376976013184e-05, -8.161179721355438e-05, -7.634982466697693e-05, -7.108785212039948e-05, -6.582587957382202e-05, -6.056390702724457e-05, -5.5301934480667114e-05, -5.003996193408966e-05, -4.477798938751221e-05, -3.9516016840934753e-05, -3.42540442943573e-05, -2.8992071747779846e-05, -2.3730099201202393e-05, -1.846812665462494e-05, -1.3206154108047485e-05, -7.944181561470032e-06, -2.682209014892578e-06, 2.5797635316848755e-06, 7.841736078262329e-06, 1.3103708624839783e-05, 1.8365681171417236e-05, 2.362765371799469e-05, 2.8889626264572144e-05, 3.41515988111496e-05, 3.941357135772705e-05, 4.4675543904304504e-05, 4.993751645088196e-05, 5.519948899745941e-05, 6.0461461544036865e-05, 6.572343409061432e-05, 7.098540663719177e-05, 7.624737918376923e-05, 8.150935173034668e-05, 8.677132427692413e-05, 9.203329682350159e-05, 9.729526937007904e-05, 0.0001025572419166565, 0.00010781921446323395, 0.0001130811870098114, 0.00011834315955638885, 0.0001236051321029663, 0.00012886710464954376, 0.00013412907719612122, 0.00013939104974269867, 0.00014465302228927612, 0.00014991499483585358, 0.00015517696738243103, 0.00016043893992900848, 0.00016570091247558594]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 12.0, 13.0, 11.0, 23.0, 44.0, 75.0, 137.0, 242.0, 454.0, 917.0, 2003.0, 5513.0, 18257.0, 80253.0, 389152.0, 427353.0, 93026.0, 20757.0, 5992.0, 2275.0, 1013.0, 448.0, 258.0, 129.0, 72.0, 38.0, 34.0, 15.0, 7.0, 4.0, 6.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31689453125, -0.3066864013671875, -0.296478271484375, -0.2862701416015625, -0.27606201171875, -0.2658538818359375, -0.255645751953125, -0.2454376220703125, -0.2352294921875, -0.2250213623046875, -0.214813232421875, -0.2046051025390625, -0.19439697265625, -0.1841888427734375, -0.173980712890625, -0.1637725830078125, -0.153564453125, -0.1433563232421875, -0.133148193359375, -0.1229400634765625, -0.11273193359375, -0.1025238037109375, -0.092315673828125, -0.0821075439453125, -0.0718994140625, -0.0616912841796875, -0.051483154296875, -0.0412750244140625, -0.03106689453125, -0.0208587646484375, -0.010650634765625, -0.0004425048828125, 0.009765625, 0.0199737548828125, 0.030181884765625, 0.0403900146484375, 0.05059814453125, 0.0608062744140625, 0.071014404296875, 0.0812225341796875, 0.0914306640625, 0.1016387939453125, 0.111846923828125, 0.1220550537109375, 0.13226318359375, 0.1424713134765625, 0.152679443359375, 0.1628875732421875, 0.173095703125, 0.1833038330078125, 0.193511962890625, 0.2037200927734375, 0.21392822265625, 0.2241363525390625, 0.234344482421875, 0.2445526123046875, 0.2547607421875, 0.2649688720703125, 0.275177001953125, 0.2853851318359375, 0.29559326171875, 0.3058013916015625, 0.316009521484375, 0.3262176513671875, 0.33642578125]}, "gradients/decoder.model.decoder.layers.3.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 6.0, 5.0, 6.0, 7.0, 7.0, 7.0, 12.0, 17.0, 16.0, 20.0, 36.0, 31.0, 46.0, 51.0, 59.0, 69.0, 77.0, 85.0, 67.0, 61.0, 55.0, 42.0, 43.0, 27.0, 33.0, 22.0, 17.0, 18.0, 6.0, 13.0, 6.0, 5.0, 5.0, 5.0, 5.0, 2.0, 3.0, 5.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.08001708984375, -0.07799243927001953, -0.07596778869628906, -0.0739431381225586, -0.07191848754882812, -0.06989383697509766, -0.06786918640136719, -0.06584453582763672, -0.06381988525390625, -0.06179523468017578, -0.05977058410644531, -0.057745933532714844, -0.055721282958984375, -0.053696632385253906, -0.05167198181152344, -0.04964733123779297, -0.0476226806640625, -0.04559803009033203, -0.04357337951660156, -0.041548728942871094, -0.039524078369140625, -0.037499427795410156, -0.03547477722167969, -0.03345012664794922, -0.03142547607421875, -0.02940082550048828, -0.027376174926757812, -0.025351524353027344, -0.023326873779296875, -0.021302223205566406, -0.019277572631835938, -0.01725292205810547, -0.015228271484375, -0.013203620910644531, -0.011178970336914062, -0.009154319763183594, -0.007129669189453125, -0.005105018615722656, -0.0030803680419921875, -0.0010557174682617188, 0.00096893310546875, 0.0029935836791992188, 0.0050182342529296875, 0.007042884826660156, 0.009067535400390625, 0.011092185974121094, 0.013116836547851562, 0.015141487121582031, 0.0171661376953125, 0.01919078826904297, 0.021215438842773438, 0.023240089416503906, 0.025264739990234375, 0.027289390563964844, 0.029314041137695312, 0.03133869171142578, 0.03336334228515625, 0.03538799285888672, 0.03741264343261719, 0.039437294006347656, 0.041461944580078125, 0.043486595153808594, 0.04551124572753906, 0.04753589630126953, 0.049560546875]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 8.0, 12.0, 32.0, 47.0, 97.0, 105.0, 133.0, 137.0, 141.0, 113.0, 70.0, 52.0, 24.0, 19.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0], "bins": [-29.67615509033203, -29.098651885986328, -28.521148681640625, -27.943647384643555, -27.36614418029785, -26.78864097595215, -26.211137771606445, -25.633634567260742, -25.056133270263672, -24.47863006591797, -23.901126861572266, -23.323625564575195, -22.746122360229492, -22.16861915588379, -21.591115951538086, -21.013612747192383, -20.43610954284668, -19.858606338500977, -19.281103134155273, -18.703601837158203, -18.1260986328125, -17.548595428466797, -16.971092224121094, -16.39358901977539, -15.816086769104004, -15.2385835647583, -14.661081314086914, -14.083578109741211, -13.506074905395508, -12.928572654724121, -12.351069450378418, -11.773567199707031, -11.196063041687012, -10.618559837341309, -10.041057586669922, -9.463554382324219, -8.886051177978516, -8.308548927307129, -7.731045722961426, -7.153542995452881, -6.576040267944336, -5.998537540435791, -5.421034812927246, -4.843531608581543, -4.266028881072998, -3.688526153564453, -3.111023187637329, -2.533520221710205, -1.9560174942016602, -1.3785146474838257, -0.8010118007659912, -0.22350895404815674, 0.35399389266967773, 0.9314966201782227, 1.5089995861053467, 2.0865025520324707, 2.6640052795410156, 3.2415080070495605, 3.8190109729766846, 4.396513938903809, 4.9740166664123535, 5.551519393920898, 6.129022598266602, 6.7065253257751465, 7.284028053283691]}, "gradients/decoder.model.decoder.layers.3.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 6.0, 3.0, 9.0, 5.0, 12.0, 12.0, 14.0, 16.0, 26.0, 21.0, 27.0, 30.0, 34.0, 34.0, 37.0, 30.0, 44.0, 41.0, 47.0, 44.0, 42.0, 39.0, 46.0, 29.0, 39.0, 36.0, 24.0, 27.0, 34.0, 29.0, 22.0, 20.0, 15.0, 17.0, 12.0, 13.0, 10.0, 11.0, 8.0, 10.0, 5.0, 2.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.985445022583008, -7.7389607429504395, -7.492475986480713, -7.2459917068481445, -6.999506950378418, -6.75302267074585, -6.506538391113281, -6.260053634643555, -6.013569355010986, -5.767085075378418, -5.520600318908691, -5.274116039276123, -5.027631759643555, -4.781147003173828, -4.53466272354126, -4.288178443908691, -4.041693687438965, -3.7952091693878174, -3.54872465133667, -3.3022403717041016, -3.055755853652954, -2.8092713356018066, -2.5627870559692383, -2.316302537918091, -2.0698180198669434, -1.823333501815796, -1.576849102973938, -1.33036470413208, -1.0838801860809326, -0.8373956680297852, -0.5909112691879272, -0.34442687034606934, -0.09794235229492188, 0.1485421061515808, 0.3950265645980835, 0.6415110230445862, 0.8879954814910889, 1.1344799995422363, 1.3809643983840942, 1.6274487972259521, 1.8739333152770996, 2.120417833328247, 2.3669023513793945, 2.613386631011963, 2.8598711490631104, 3.106355667114258, 3.352839946746826, 3.5993244647979736, 3.845808982849121, 4.0922932624816895, 4.338778018951416, 4.585262298583984, 4.831747055053711, 5.078231334686279, 5.324715614318848, 5.571200370788574, 5.817684650421143, 6.064168930053711, 6.3106536865234375, 6.557137966156006, 6.803622245788574, 7.050107002258301, 7.296591281890869, 7.5430755615234375, 7.789560317993164]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 1.0, 7.0, 8.0, 12.0, 20.0, 33.0, 42.0, 58.0, 82.0, 128.0, 190.0, 342.0, 749.0, 1712.0, 4464.0, 12365.0, 36166.0, 113947.0, 569123.0, 221040.0, 57195.0, 19219.0, 6838.0, 2526.0, 1050.0, 510.0, 268.0, 152.0, 90.0, 64.0, 44.0, 22.0, 25.0, 11.0, 13.0, 8.0, 8.0, 7.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-10.296875, -9.97216796875, -9.6474609375, -9.32275390625, -8.998046875, -8.67333984375, -8.3486328125, -8.02392578125, -7.69921875, -7.37451171875, -7.0498046875, -6.72509765625, -6.400390625, -6.07568359375, -5.7509765625, -5.42626953125, -5.1015625, -4.77685546875, -4.4521484375, -4.12744140625, -3.802734375, -3.47802734375, -3.1533203125, -2.82861328125, -2.50390625, -2.17919921875, -1.8544921875, -1.52978515625, -1.205078125, -0.88037109375, -0.5556640625, -0.23095703125, 0.09375, 0.41845703125, 0.7431640625, 1.06787109375, 1.392578125, 1.71728515625, 2.0419921875, 2.36669921875, 2.69140625, 3.01611328125, 3.3408203125, 3.66552734375, 3.990234375, 4.31494140625, 4.6396484375, 4.96435546875, 5.2890625, 5.61376953125, 5.9384765625, 6.26318359375, 6.587890625, 6.91259765625, 7.2373046875, 7.56201171875, 7.88671875, 8.21142578125, 8.5361328125, 8.86083984375, 9.185546875, 9.51025390625, 9.8349609375, 10.15966796875, 10.484375]}, "gradients/decoder.model.decoder.layers.3.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 7.0, 8.0, 10.0, 14.0, 14.0, 18.0, 27.0, 33.0, 22.0, 31.0, 26.0, 33.0, 37.0, 41.0, 44.0, 43.0, 47.0, 46.0, 38.0, 48.0, 30.0, 31.0, 26.0, 26.0, 26.0, 42.0, 30.0, 27.0, 19.0, 21.0, 17.0, 14.0, 10.0, 7.0, 14.0, 13.0, 9.0, 7.0, 4.0, 6.0, 6.0, 1.0, 3.0, 6.0, 3.0, 1.0, 1.0], "bins": [-16.484375, -16.01416015625, -15.5439453125, -15.07373046875, -14.603515625, -14.13330078125, -13.6630859375, -13.19287109375, -12.72265625, -12.25244140625, -11.7822265625, -11.31201171875, -10.841796875, -10.37158203125, -9.9013671875, -9.43115234375, -8.9609375, -8.49072265625, -8.0205078125, -7.55029296875, -7.080078125, -6.60986328125, -6.1396484375, -5.66943359375, -5.19921875, -4.72900390625, -4.2587890625, -3.78857421875, -3.318359375, -2.84814453125, -2.3779296875, -1.90771484375, -1.4375, -0.96728515625, -0.4970703125, -0.02685546875, 0.443359375, 0.91357421875, 1.3837890625, 1.85400390625, 2.32421875, 2.79443359375, 3.2646484375, 3.73486328125, 4.205078125, 4.67529296875, 5.1455078125, 5.61572265625, 6.0859375, 6.55615234375, 7.0263671875, 7.49658203125, 7.966796875, 8.43701171875, 8.9072265625, 9.37744140625, 9.84765625, 10.31787109375, 10.7880859375, 11.25830078125, 11.728515625, 12.19873046875, 12.6689453125, 13.13916015625, 13.609375]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 2.0, 8.0, 9.0, 8.0, 15.0, 18.0, 21.0, 30.0, 40.0, 52.0, 98.0, 107.0, 161.0, 261.0, 412.0, 955.0, 5575.0, 122487.0, 885525.0, 29030.0, 2028.0, 628.0, 344.0, 213.0, 157.0, 93.0, 63.0, 46.0, 49.0, 25.0, 15.0, 15.0, 12.0, 7.0, 7.0, 11.0, 9.0, 6.0, 4.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.546875, -24.643798828125, -23.74072265625, -22.837646484375, -21.9345703125, -21.031494140625, -20.12841796875, -19.225341796875, -18.322265625, -17.419189453125, -16.51611328125, -15.613037109375, -14.7099609375, -13.806884765625, -12.90380859375, -12.000732421875, -11.09765625, -10.194580078125, -9.29150390625, -8.388427734375, -7.4853515625, -6.582275390625, -5.67919921875, -4.776123046875, -3.873046875, -2.969970703125, -2.06689453125, -1.163818359375, -0.2607421875, 0.642333984375, 1.54541015625, 2.448486328125, 3.3515625, 4.254638671875, 5.15771484375, 6.060791015625, 6.9638671875, 7.866943359375, 8.77001953125, 9.673095703125, 10.576171875, 11.479248046875, 12.38232421875, 13.285400390625, 14.1884765625, 15.091552734375, 15.99462890625, 16.897705078125, 17.80078125, 18.703857421875, 19.60693359375, 20.510009765625, 21.4130859375, 22.316162109375, 23.21923828125, 24.122314453125, 25.025390625, 25.928466796875, 26.83154296875, 27.734619140625, 28.6376953125, 29.540771484375, 30.44384765625, 31.346923828125, 32.25]}, "gradients/decoder.model.decoder.layers.3.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 5.0, 8.0, 8.0, 16.0, 19.0, 25.0, 23.0, 31.0, 44.0, 41.0, 55.0, 58.0, 65.0, 65.0, 63.0, 44.0, 65.0, 60.0, 50.0, 48.0, 29.0, 46.0, 30.0, 16.0, 13.0, 18.0, 7.0, 12.0, 5.0, 4.0, 11.0, 3.0, 7.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.109375, -19.283935546875, -18.45849609375, -17.633056640625, -16.8076171875, -15.982177734375, -15.15673828125, -14.331298828125, -13.505859375, -12.680419921875, -11.85498046875, -11.029541015625, -10.2041015625, -9.378662109375, -8.55322265625, -7.727783203125, -6.90234375, -6.076904296875, -5.25146484375, -4.426025390625, -3.6005859375, -2.775146484375, -1.94970703125, -1.124267578125, -0.298828125, 0.526611328125, 1.35205078125, 2.177490234375, 3.0029296875, 3.828369140625, 4.65380859375, 5.479248046875, 6.3046875, 7.130126953125, 7.95556640625, 8.781005859375, 9.6064453125, 10.431884765625, 11.25732421875, 12.082763671875, 12.908203125, 13.733642578125, 14.55908203125, 15.384521484375, 16.2099609375, 17.035400390625, 17.86083984375, 18.686279296875, 19.51171875, 20.337158203125, 21.16259765625, 21.988037109375, 22.8134765625, 23.638916015625, 24.46435546875, 25.289794921875, 26.115234375, 26.940673828125, 27.76611328125, 28.591552734375, 29.4169921875, 30.242431640625, 31.06787109375, 31.893310546875, 32.71875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 7.0, 11.0, 20.0, 53.0, 82.0, 146.0, 334.0, 714.0, 1922.0, 16704.0, 961809.0, 62042.0, 3048.0, 843.0, 383.0, 215.0, 96.0, 64.0, 24.0, 11.0, 8.0, 8.0, 7.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1640625, -14.71337890625, -14.2626953125, -13.81201171875, -13.361328125, -12.91064453125, -12.4599609375, -12.00927734375, -11.55859375, -11.10791015625, -10.6572265625, -10.20654296875, -9.755859375, -9.30517578125, -8.8544921875, -8.40380859375, -7.953125, -7.50244140625, -7.0517578125, -6.60107421875, -6.150390625, -5.69970703125, -5.2490234375, -4.79833984375, -4.34765625, -3.89697265625, -3.4462890625, -2.99560546875, -2.544921875, -2.09423828125, -1.6435546875, -1.19287109375, -0.7421875, -0.29150390625, 0.1591796875, 0.60986328125, 1.060546875, 1.51123046875, 1.9619140625, 2.41259765625, 2.86328125, 3.31396484375, 3.7646484375, 4.21533203125, 4.666015625, 5.11669921875, 5.5673828125, 6.01806640625, 6.46875, 6.91943359375, 7.3701171875, 7.82080078125, 8.271484375, 8.72216796875, 9.1728515625, 9.62353515625, 10.07421875, 10.52490234375, 10.9755859375, 11.42626953125, 11.876953125, 12.32763671875, 12.7783203125, 13.22900390625, 13.6796875]}, "gradients/decoder.model.decoder.layers.3.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 3.0, 3.0, 9.0, 10.0, 15.0, 23.0, 60.0, 85.0, 262.0, 316.0, 86.0, 53.0, 39.0, 15.0, 13.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001102447509765625, -0.0010473430156707764, -0.0009922385215759277, -0.0009371340274810791, -0.0008820295333862305, -0.0008269250392913818, -0.0007718205451965332, -0.0007167160511016846, -0.0006616115570068359, -0.0006065070629119873, -0.0005514025688171387, -0.00049629807472229, -0.0004411935806274414, -0.0003860890865325928, -0.00033098459243774414, -0.0002758800983428955, -0.00022077560424804688, -0.00016567111015319824, -0.00011056661605834961, -5.5462121963500977e-05, -3.5762786865234375e-07, 5.474686622619629e-05, 0.00010985136032104492, 0.00016495585441589355, 0.0002200603485107422, 0.0002751648426055908, 0.00033026933670043945, 0.0003853738307952881, 0.0004404783248901367, 0.0004955828189849854, 0.000550687313079834, 0.0006057918071746826, 0.0006608963012695312, 0.0007160007953643799, 0.0007711052894592285, 0.0008262097835540771, 0.0008813142776489258, 0.0009364187717437744, 0.000991523265838623, 0.0010466277599334717, 0.0011017322540283203, 0.001156836748123169, 0.0012119412422180176, 0.0012670457363128662, 0.0013221502304077148, 0.0013772547245025635, 0.0014323592185974121, 0.0014874637126922607, 0.0015425682067871094, 0.001597672700881958, 0.0016527771949768066, 0.0017078816890716553, 0.001762986183166504, 0.0018180906772613525, 0.0018731951713562012, 0.0019282996654510498, 0.0019834041595458984, 0.002038508653640747, 0.0020936131477355957, 0.0021487176418304443, 0.002203822135925293, 0.0022589266300201416, 0.0023140311241149902, 0.002369135618209839, 0.0024242401123046875]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 5.0, 9.0, 21.0, 24.0, 40.0, 45.0, 70.0, 83.0, 116.0, 155.0, 226.0, 325.0, 537.0, 996.0, 3282.0, 21470.0, 339076.0, 647020.0, 28385.0, 3867.0, 1149.0, 500.0, 326.0, 244.0, 163.0, 114.0, 90.0, 71.0, 42.0, 31.0, 21.0, 9.0, 13.0, 4.0, 7.0, 4.0, 4.0, 4.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.4375, -7.16259765625, -6.8876953125, -6.61279296875, -6.337890625, -6.06298828125, -5.7880859375, -5.51318359375, -5.23828125, -4.96337890625, -4.6884765625, -4.41357421875, -4.138671875, -3.86376953125, -3.5888671875, -3.31396484375, -3.0390625, -2.76416015625, -2.4892578125, -2.21435546875, -1.939453125, -1.66455078125, -1.3896484375, -1.11474609375, -0.83984375, -0.56494140625, -0.2900390625, -0.01513671875, 0.259765625, 0.53466796875, 0.8095703125, 1.08447265625, 1.359375, 1.63427734375, 1.9091796875, 2.18408203125, 2.458984375, 2.73388671875, 3.0087890625, 3.28369140625, 3.55859375, 3.83349609375, 4.1083984375, 4.38330078125, 4.658203125, 4.93310546875, 5.2080078125, 5.48291015625, 5.7578125, 6.03271484375, 6.3076171875, 6.58251953125, 6.857421875, 7.13232421875, 7.4072265625, 7.68212890625, 7.95703125, 8.23193359375, 8.5068359375, 8.78173828125, 9.056640625, 9.33154296875, 9.6064453125, 9.88134765625, 10.15625]}, "gradients/decoder.model.decoder.layers.3.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 11.0, 8.0, 12.0, 13.0, 25.0, 11.0, 17.0, 33.0, 37.0, 58.0, 54.0, 175.0, 194.0, 68.0, 52.0, 49.0, 41.0, 40.0, 21.0, 12.0, 14.0, 11.0, 10.0, 8.0, 9.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.431640625, -2.3660736083984375, -2.300506591796875, -2.2349395751953125, -2.16937255859375, -2.1038055419921875, -2.038238525390625, -1.9726715087890625, -1.9071044921875, -1.8415374755859375, -1.775970458984375, -1.7104034423828125, -1.64483642578125, -1.5792694091796875, -1.513702392578125, -1.4481353759765625, -1.382568359375, -1.3170013427734375, -1.251434326171875, -1.1858673095703125, -1.12030029296875, -1.0547332763671875, -0.989166259765625, -0.9235992431640625, -0.8580322265625, -0.7924652099609375, -0.726898193359375, -0.6613311767578125, -0.59576416015625, -0.5301971435546875, -0.464630126953125, -0.3990631103515625, -0.33349609375, -0.2679290771484375, -0.202362060546875, -0.1367950439453125, -0.07122802734375, -0.0056610107421875, 0.059906005859375, 0.1254730224609375, 0.1910400390625, 0.2566070556640625, 0.322174072265625, 0.3877410888671875, 0.45330810546875, 0.5188751220703125, 0.584442138671875, 0.6500091552734375, 0.715576171875, 0.7811431884765625, 0.846710205078125, 0.9122772216796875, 0.97784423828125, 1.0434112548828125, 1.108978271484375, 1.1745452880859375, 1.2401123046875, 1.3056793212890625, 1.371246337890625, 1.4368133544921875, 1.50238037109375, 1.5679473876953125, 1.633514404296875, 1.6990814208984375, 1.7646484375]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 10.0, 15.0, 75.0, 150.0, 258.0, 261.0, 150.0, 62.0, 20.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.316856384277344, -25.951107025146484, -23.585357666015625, -21.2196102142334, -18.85386085510254, -16.48811149597168, -14.122363090515137, -11.756614685058594, -9.390865325927734, -7.025116443634033, -4.659367561340332, -2.293618679046631, 0.07213020324707031, 2.4378795623779297, 4.803627967834473, 7.169376373291016, 9.535125732421875, 11.900875091552734, 14.266623497009277, 16.63237190246582, 18.99812126159668, 21.36387062072754, 23.729618072509766, 26.095367431640625, 28.461116790771484, 30.826866149902344, 33.1926155090332, 35.55836486816406, 37.924110412597656, 40.28986358642578, 42.655609130859375, 45.021358489990234, 47.38710021972656, 49.75284957885742, 52.11859893798828, 54.48434829711914, 56.85009765625, 59.215843200683594, 61.58159255981445, 63.94734191894531, 66.31309509277344, 68.67884063720703, 71.04459381103516, 73.41033935546875, 75.77609252929688, 78.14183807373047, 80.5075912475586, 82.87333679199219, 85.23908233642578, 87.60482788085938, 89.9705810546875, 92.3363265991211, 94.70207977294922, 97.06782531738281, 99.43357849121094, 101.79932403564453, 104.16506958007812, 106.53081512451172, 108.89656829833984, 111.26231384277344, 113.62806701660156, 115.99381256103516, 118.35956573486328, 120.72531127929688, 123.091064453125]}, "gradients/decoder.model.decoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 6.0, 10.0, 13.0, 8.0, 14.0, 11.0, 14.0, 21.0, 24.0, 24.0, 27.0, 27.0, 27.0, 25.0, 39.0, 32.0, 36.0, 38.0, 31.0, 52.0, 41.0, 33.0, 36.0, 42.0, 33.0, 32.0, 27.0, 32.0, 32.0, 30.0, 21.0, 30.0, 25.0, 13.0, 13.0, 17.0, 8.0, 9.0, 13.0, 7.0, 10.0, 3.0, 0.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-29.678855895996094, -28.77014923095703, -27.86144256591797, -26.95273780822754, -26.044031143188477, -25.135324478149414, -24.226619720458984, -23.317913055419922, -22.40920639038086, -21.500499725341797, -20.591793060302734, -19.683088302612305, -18.774381637573242, -17.86567497253418, -16.95697021484375, -16.048263549804688, -15.139556884765625, -14.230850219726562, -13.322144508361816, -12.41343879699707, -11.504732131958008, -10.596025466918945, -9.6873197555542, -8.778614044189453, -7.869907379150391, -6.961201190948486, -6.052495002746582, -5.143788814544678, -4.235082626342773, -3.326376438140869, -2.417670249938965, -1.5089640617370605, -0.6002578735351562, 0.30844831466674805, 1.2171545028686523, 2.1258606910705566, 3.034566879272461, 3.9432730674743652, 4.8519792556762695, 5.760685443878174, 6.669391632080078, 7.578097820281982, 8.486804008483887, 9.395509719848633, 10.304216384887695, 11.212923049926758, 12.121628761291504, 13.03033447265625, 13.939041137695312, 14.847747802734375, 15.756453514099121, 16.665159225463867, 17.57386589050293, 18.482572555541992, 19.391277313232422, 20.299983978271484, 21.208690643310547, 22.11739730834961, 23.026103973388672, 23.9348087310791, 24.843515396118164, 25.752222061157227, 26.660926818847656, 27.56963348388672, 28.47834014892578]}, "gradients/decoder.model.decoder.layers.2.fc2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 3.0, 11.0, 6.0, 12.0, 4.0, 19.0, 12.0, 9.0, 23.0, 26.0, 28.0, 23.0, 26.0, 32.0, 39.0, 54.0, 104.0, 181.0, 577.0, 3686.0, 154123.0, 3936650.0, 94592.0, 2942.0, 477.0, 191.0, 86.0, 60.0, 48.0, 36.0, 31.0, 28.0, 24.0, 17.0, 16.0, 19.0, 13.0, 12.0, 10.0, 11.0, 2.0, 4.0, 4.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-46.71875, -45.2333984375, -43.748046875, -42.2626953125, -40.77734375, -39.2919921875, -37.806640625, -36.3212890625, -34.8359375, -33.3505859375, -31.865234375, -30.3798828125, -28.89453125, -27.4091796875, -25.923828125, -24.4384765625, -22.953125, -21.4677734375, -19.982421875, -18.4970703125, -17.01171875, -15.5263671875, -14.041015625, -12.5556640625, -11.0703125, -9.5849609375, -8.099609375, -6.6142578125, -5.12890625, -3.6435546875, -2.158203125, -0.6728515625, 0.8125, 2.2978515625, 3.783203125, 5.2685546875, 6.75390625, 8.2392578125, 9.724609375, 11.2099609375, 12.6953125, 14.1806640625, 15.666015625, 17.1513671875, 18.63671875, 20.1220703125, 21.607421875, 23.0927734375, 24.578125, 26.0634765625, 27.548828125, 29.0341796875, 30.51953125, 32.0048828125, 33.490234375, 34.9755859375, 36.4609375, 37.9462890625, 39.431640625, 40.9169921875, 42.40234375, 43.8876953125, 45.373046875, 46.8583984375, 48.34375]}, "gradients/decoder.model.decoder.layers.2.fc2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 7.0, 5.0, 7.0, 3.0, 10.0, 14.0, 8.0, 13.0, 12.0, 19.0, 21.0, 26.0, 30.0, 38.0, 34.0, 37.0, 32.0, 35.0, 40.0, 44.0, 42.0, 44.0, 33.0, 44.0, 45.0, 32.0, 42.0, 34.0, 32.0, 21.0, 32.0, 20.0, 21.0, 19.0, 17.0, 9.0, 6.0, 13.0, 13.0, 12.0, 11.0, 11.0, 2.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-9.40625, -9.11962890625, -8.8330078125, -8.54638671875, -8.259765625, -7.97314453125, -7.6865234375, -7.39990234375, -7.11328125, -6.82666015625, -6.5400390625, -6.25341796875, -5.966796875, -5.68017578125, -5.3935546875, -5.10693359375, -4.8203125, -4.53369140625, -4.2470703125, -3.96044921875, -3.673828125, -3.38720703125, -3.1005859375, -2.81396484375, -2.52734375, -2.24072265625, -1.9541015625, -1.66748046875, -1.380859375, -1.09423828125, -0.8076171875, -0.52099609375, -0.234375, 0.05224609375, 0.3388671875, 0.62548828125, 0.912109375, 1.19873046875, 1.4853515625, 1.77197265625, 2.05859375, 2.34521484375, 2.6318359375, 2.91845703125, 3.205078125, 3.49169921875, 3.7783203125, 4.06494140625, 4.3515625, 4.63818359375, 4.9248046875, 5.21142578125, 5.498046875, 5.78466796875, 6.0712890625, 6.35791015625, 6.64453125, 6.93115234375, 7.2177734375, 7.50439453125, 7.791015625, 8.07763671875, 8.3642578125, 8.65087890625, 8.9375]}, "gradients/decoder.model.decoder.layers.2.fc1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 9.0, 9.0, 19.0, 43.0, 94.0, 147.0, 349.0, 1079.0, 4260.0, 41040.0, 3202656.0, 923268.0, 17368.0, 2629.0, 756.0, 276.0, 121.0, 78.0, 29.0, 12.0, 15.0, 7.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.46875, -44.431884765625, -43.39501953125, -42.358154296875, -41.3212890625, -40.284423828125, -39.24755859375, -38.210693359375, -37.173828125, -36.136962890625, -35.10009765625, -34.063232421875, -33.0263671875, -31.989501953125, -30.95263671875, -29.915771484375, -28.87890625, -27.842041015625, -26.80517578125, -25.768310546875, -24.7314453125, -23.694580078125, -22.65771484375, -21.620849609375, -20.583984375, -19.547119140625, -18.51025390625, -17.473388671875, -16.4365234375, -15.399658203125, -14.36279296875, -13.325927734375, -12.2890625, -11.252197265625, -10.21533203125, -9.178466796875, -8.1416015625, -7.104736328125, -6.06787109375, -5.031005859375, -3.994140625, -2.957275390625, -1.92041015625, -0.883544921875, 0.1533203125, 1.190185546875, 2.22705078125, 3.263916015625, 4.30078125, 5.337646484375, 6.37451171875, 7.411376953125, 8.4482421875, 9.485107421875, 10.52197265625, 11.558837890625, 12.595703125, 13.632568359375, 14.66943359375, 15.706298828125, 16.7431640625, 17.780029296875, 18.81689453125, 19.853759765625, 20.890625]}, "gradients/decoder.model.decoder.layers.2.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 1.0, 1.0, 5.0, 9.0, 13.0, 13.0, 25.0, 30.0, 58.0, 69.0, 113.0, 158.0, 256.0, 393.0, 533.0, 614.0, 550.0, 409.0, 264.0, 182.0, 128.0, 96.0, 47.0, 30.0, 24.0, 16.0, 8.0, 6.0, 3.0, 6.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.80078125, -5.6279296875, -5.455078125, -5.2822265625, -5.109375, -4.9365234375, -4.763671875, -4.5908203125, -4.41796875, -4.2451171875, -4.072265625, -3.8994140625, -3.7265625, -3.5537109375, -3.380859375, -3.2080078125, -3.03515625, -2.8623046875, -2.689453125, -2.5166015625, -2.34375, -2.1708984375, -1.998046875, -1.8251953125, -1.65234375, -1.4794921875, -1.306640625, -1.1337890625, -0.9609375, -0.7880859375, -0.615234375, -0.4423828125, -0.26953125, -0.0966796875, 0.076171875, 0.2490234375, 0.421875, 0.5947265625, 0.767578125, 0.9404296875, 1.11328125, 1.2861328125, 1.458984375, 1.6318359375, 1.8046875, 1.9775390625, 2.150390625, 2.3232421875, 2.49609375, 2.6689453125, 2.841796875, 3.0146484375, 3.1875, 3.3603515625, 3.533203125, 3.7060546875, 3.87890625, 4.0517578125, 4.224609375, 4.3974609375, 4.5703125, 4.7431640625, 4.916015625, 5.0888671875, 5.26171875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 9.0, 12.0, 23.0, 25.0, 41.0, 56.0, 69.0, 81.0, 82.0, 95.0, 88.0, 89.0, 79.0, 63.0, 63.0, 40.0, 32.0, 21.0, 9.0, 8.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-28.630205154418945, -28.005146026611328, -27.38008689880371, -26.75502586364746, -26.129966735839844, -25.504907608032227, -24.87984848022461, -24.254789352416992, -23.629730224609375, -23.004671096801758, -22.37961196899414, -21.75455093383789, -21.129491806030273, -20.504432678222656, -19.87937355041504, -19.254314422607422, -18.629253387451172, -18.004194259643555, -17.379135131835938, -16.754074096679688, -16.12901496887207, -15.503955841064453, -14.878896713256836, -14.253837585449219, -13.628777503967285, -13.003718376159668, -12.378658294677734, -11.753599166870117, -11.1285400390625, -10.503479957580566, -9.87842082977295, -9.253360748291016, -8.628301620483398, -8.003242492675781, -7.378182411193848, -6.7531232833862305, -6.128063678741455, -5.50300407409668, -4.8779449462890625, -4.252885341644287, -3.6278257369995117, -3.0027661323547363, -2.37770676612854, -1.7526472806930542, -1.1275877952575684, -0.502528190612793, 0.12253117561340332, 0.7475905418395996, 1.372650146484375, 1.9977096319198608, 2.6227691173553467, 3.247828483581543, 3.8728880882263184, 4.497947692871094, 5.123006820678711, 5.748066425323486, 6.373126029968262, 6.998185634613037, 7.6232452392578125, 8.24830436706543, 8.873363494873047, 9.49842357635498, 10.123482704162598, 10.748542785644531, 11.373601913452148]}, "gradients/decoder.model.decoder.layers.2.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 6.0, 8.0, 4.0, 16.0, 13.0, 9.0, 8.0, 16.0, 24.0, 21.0, 25.0, 23.0, 34.0, 28.0, 35.0, 32.0, 34.0, 32.0, 40.0, 42.0, 32.0, 40.0, 34.0, 46.0, 35.0, 28.0, 37.0, 33.0, 36.0, 23.0, 20.0, 26.0, 21.0, 17.0, 23.0, 13.0, 15.0, 12.0, 14.0, 6.0, 8.0, 6.0, 5.0, 6.0, 4.0, 2.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.711785316467285, -9.388851165771484, -9.065916061401367, -8.742981910705566, -8.420047760009766, -8.097112655639648, -7.774178504943848, -7.451244354248047, -7.128309726715088, -6.805375099182129, -6.482440948486328, -6.159506320953369, -5.83657169342041, -5.513637542724609, -5.19070291519165, -4.867768287658691, -4.544834136962891, -4.221899509429932, -3.898965358734131, -3.576030731201172, -3.253096342086792, -2.930161952972412, -2.607227325439453, -2.2842929363250732, -1.9613585472106934, -1.6384241580963135, -1.315489649772644, -0.9925552010536194, -0.6696207523345947, -0.34668636322021484, -0.02375185489654541, 0.299182653427124, 0.6221179962158203, 0.945052444934845, 1.2679868936538696, 1.590921401977539, 1.913855791091919, 2.236790180206299, 2.559724807739258, 2.8826591968536377, 3.2055935859680176, 3.5285279750823975, 3.8514623641967773, 4.174396991729736, 4.497331619262695, 4.820265769958496, 5.143200397491455, 5.466135025024414, 5.789069175720215, 6.112003803253174, 6.434937953948975, 6.757872581481934, 7.080806732177734, 7.403741359710693, 7.726675987243652, 8.049610137939453, 8.37254524230957, 8.695479393005371, 9.018414497375488, 9.341348648071289, 9.66428279876709, 9.98721694946289, 10.310152053833008, 10.633086204528809, 10.95602035522461]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 5.0, 10.0, 5.0, 21.0, 13.0, 28.0, 55.0, 81.0, 112.0, 166.0, 233.0, 369.0, 665.0, 1350.0, 3463.0, 11525.0, 48012.0, 226071.0, 495360.0, 201375.0, 43266.0, 10264.0, 3153.0, 1281.0, 637.0, 372.0, 224.0, 141.0, 100.0, 54.0, 51.0, 32.0, 27.0, 16.0, 11.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.431640625, -3.311065673828125, -3.19049072265625, -3.069915771484375, -2.9493408203125, -2.828765869140625, -2.70819091796875, -2.587615966796875, -2.467041015625, -2.346466064453125, -2.22589111328125, -2.105316162109375, -1.9847412109375, -1.864166259765625, -1.74359130859375, -1.623016357421875, -1.50244140625, -1.381866455078125, -1.26129150390625, -1.140716552734375, -1.0201416015625, -0.899566650390625, -0.77899169921875, -0.658416748046875, -0.537841796875, -0.417266845703125, -0.29669189453125, -0.176116943359375, -0.0555419921875, 0.065032958984375, 0.18560791015625, 0.306182861328125, 0.4267578125, 0.547332763671875, 0.66790771484375, 0.788482666015625, 0.9090576171875, 1.029632568359375, 1.15020751953125, 1.270782470703125, 1.391357421875, 1.511932373046875, 1.63250732421875, 1.753082275390625, 1.8736572265625, 1.994232177734375, 2.11480712890625, 2.235382080078125, 2.35595703125, 2.476531982421875, 2.59710693359375, 2.717681884765625, 2.8382568359375, 2.958831787109375, 3.07940673828125, 3.199981689453125, 3.320556640625, 3.441131591796875, 3.56170654296875, 3.682281494140625, 3.8028564453125, 3.923431396484375, 4.04400634765625, 4.164581298828125, 4.28515625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 11.0, 10.0, 14.0, 17.0, 15.0, 22.0, 24.0, 30.0, 37.0, 42.0, 40.0, 48.0, 37.0, 44.0, 50.0, 42.0, 54.0, 56.0, 54.0, 52.0, 41.0, 40.0, 41.0, 28.0, 36.0, 22.0, 25.0, 19.0, 13.0, 7.0, 5.0, 7.0, 5.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0], "bins": [-12.078125, -11.76953125, -11.4609375, -11.15234375, -10.84375, -10.53515625, -10.2265625, -9.91796875, -9.609375, -9.30078125, -8.9921875, -8.68359375, -8.375, -8.06640625, -7.7578125, -7.44921875, -7.140625, -6.83203125, -6.5234375, -6.21484375, -5.90625, -5.59765625, -5.2890625, -4.98046875, -4.671875, -4.36328125, -4.0546875, -3.74609375, -3.4375, -3.12890625, -2.8203125, -2.51171875, -2.203125, -1.89453125, -1.5859375, -1.27734375, -0.96875, -0.66015625, -0.3515625, -0.04296875, 0.265625, 0.57421875, 0.8828125, 1.19140625, 1.5, 1.80859375, 2.1171875, 2.42578125, 2.734375, 3.04296875, 3.3515625, 3.66015625, 3.96875, 4.27734375, 4.5859375, 4.89453125, 5.203125, 5.51171875, 5.8203125, 6.12890625, 6.4375, 6.74609375, 7.0546875, 7.36328125, 7.671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 9.0, 13.0, 12.0, 26.0, 57.0, 59.0, 126.0, 188.0, 323.0, 474.0, 933.0, 1708.0, 3354.0, 6438.0, 12571.0, 25107.0, 50701.0, 98708.0, 173203.0, 233082.0, 197116.0, 118271.0, 62274.0, 31338.0, 15905.0, 7796.0, 4040.0, 2080.0, 1129.0, 639.0, 360.0, 176.0, 144.0, 74.0, 45.0, 22.0, 17.0, 16.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-1.599609375, -1.55712890625, -1.5146484375, -1.47216796875, -1.4296875, -1.38720703125, -1.3447265625, -1.30224609375, -1.259765625, -1.21728515625, -1.1748046875, -1.13232421875, -1.08984375, -1.04736328125, -1.0048828125, -0.96240234375, -0.919921875, -0.87744140625, -0.8349609375, -0.79248046875, -0.75, -0.70751953125, -0.6650390625, -0.62255859375, -0.580078125, -0.53759765625, -0.4951171875, -0.45263671875, -0.41015625, -0.36767578125, -0.3251953125, -0.28271484375, -0.240234375, -0.19775390625, -0.1552734375, -0.11279296875, -0.0703125, -0.02783203125, 0.0146484375, 0.05712890625, 0.099609375, 0.14208984375, 0.1845703125, 0.22705078125, 0.26953125, 0.31201171875, 0.3544921875, 0.39697265625, 0.439453125, 0.48193359375, 0.5244140625, 0.56689453125, 0.609375, 0.65185546875, 0.6943359375, 0.73681640625, 0.779296875, 0.82177734375, 0.8642578125, 0.90673828125, 0.94921875, 0.99169921875, 1.0341796875, 1.07666015625, 1.119140625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 5.0, 5.0, 4.0, 7.0, 8.0, 7.0, 7.0, 15.0, 14.0, 18.0, 25.0, 31.0, 37.0, 48.0, 47.0, 58.0, 54.0, 56.0, 41.0, 60.0, 53.0, 47.0, 53.0, 52.0, 48.0, 45.0, 34.0, 15.0, 28.0, 19.0, 13.0, 11.0, 10.0, 5.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-25.3125, -24.638916015625, -23.96533203125, -23.291748046875, -22.6181640625, -21.944580078125, -21.27099609375, -20.597412109375, -19.923828125, -19.250244140625, -18.57666015625, -17.903076171875, -17.2294921875, -16.555908203125, -15.88232421875, -15.208740234375, -14.53515625, -13.861572265625, -13.18798828125, -12.514404296875, -11.8408203125, -11.167236328125, -10.49365234375, -9.820068359375, -9.146484375, -8.472900390625, -7.79931640625, -7.125732421875, -6.4521484375, -5.778564453125, -5.10498046875, -4.431396484375, -3.7578125, -3.084228515625, -2.41064453125, -1.737060546875, -1.0634765625, -0.389892578125, 0.28369140625, 0.957275390625, 1.630859375, 2.304443359375, 2.97802734375, 3.651611328125, 4.3251953125, 4.998779296875, 5.67236328125, 6.345947265625, 7.01953125, 7.693115234375, 8.36669921875, 9.040283203125, 9.7138671875, 10.387451171875, 11.06103515625, 11.734619140625, 12.408203125, 13.081787109375, 13.75537109375, 14.428955078125, 15.1025390625, 15.776123046875, 16.44970703125, 17.123291015625, 17.796875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 5.0, 6.0, 14.0, 9.0, 23.0, 23.0, 35.0, 52.0, 68.0, 111.0, 143.0, 174.0, 294.0, 451.0, 704.0, 1120.0, 1998.0, 3777.0, 8199.0, 20495.0, 58588.0, 178935.0, 379606.0, 255275.0, 86726.0, 29035.0, 11283.0, 5031.0, 2452.0, 1388.0, 840.0, 528.0, 371.0, 235.0, 161.0, 103.0, 87.0, 74.0, 40.0, 20.0, 23.0, 14.0, 13.0, 8.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.259765625, -0.25205230712890625, -0.2443389892578125, -0.23662567138671875, -0.228912353515625, -0.22119903564453125, -0.2134857177734375, -0.20577239990234375, -0.19805908203125, -0.19034576416015625, -0.1826324462890625, -0.17491912841796875, -0.167205810546875, -0.15949249267578125, -0.1517791748046875, -0.14406585693359375, -0.1363525390625, -0.12863922119140625, -0.1209259033203125, -0.11321258544921875, -0.105499267578125, -0.09778594970703125, -0.0900726318359375, -0.08235931396484375, -0.07464599609375, -0.06693267822265625, -0.0592193603515625, -0.05150604248046875, -0.043792724609375, -0.03607940673828125, -0.0283660888671875, -0.02065277099609375, -0.012939453125, -0.00522613525390625, 0.0024871826171875, 0.01020050048828125, 0.017913818359375, 0.02562713623046875, 0.0333404541015625, 0.04105377197265625, 0.04876708984375, 0.05648040771484375, 0.0641937255859375, 0.07190704345703125, 0.079620361328125, 0.08733367919921875, 0.0950469970703125, 0.10276031494140625, 0.1104736328125, 0.11818695068359375, 0.1259002685546875, 0.13361358642578125, 0.141326904296875, 0.14904022216796875, 0.1567535400390625, 0.16446685791015625, 0.17218017578125, 0.17989349365234375, 0.1876068115234375, 0.19532012939453125, 0.203033447265625, 0.21074676513671875, 0.2184600830078125, 0.22617340087890625, 0.23388671875]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 5.0, 15.0, 20.0, 13.0, 21.0, 22.0, 24.0, 34.0, 28.0, 47.0, 59.0, 58.0, 75.0, 71.0, 79.0, 62.0, 52.0, 51.0, 47.0, 32.0, 27.0, 23.0, 25.0, 14.0, 14.0, 13.0, 13.0, 7.0, 6.0, 9.0, 5.0, 4.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.000164031982421875, -0.0001596761867403984, -0.00015532039105892181, -0.00015096459537744522, -0.00014660879969596863, -0.00014225300401449203, -0.00013789720833301544, -0.00013354141265153885, -0.00012918561697006226, -0.00012482982128858566, -0.00012047402560710907, -0.00011611822992563248, -0.00011176243424415588, -0.00010740663856267929, -0.0001030508428812027, -9.86950471997261e-05, -9.433925151824951e-05, -8.998345583677292e-05, -8.562766015529633e-05, -8.127186447381973e-05, -7.691606879234314e-05, -7.256027311086655e-05, -6.820447742938995e-05, -6.384868174791336e-05, -5.949288606643677e-05, -5.5137090384960175e-05, -5.078129470348358e-05, -4.642549902200699e-05, -4.2069703340530396e-05, -3.77139076590538e-05, -3.335811197757721e-05, -2.9002316296100616e-05, -2.4646520614624023e-05, -2.029072493314743e-05, -1.5934929251670837e-05, -1.1579133570194244e-05, -7.223337888717651e-06, -2.8675422072410583e-06, 1.4882534742355347e-06, 5.844049155712128e-06, 1.019984483718872e-05, 1.4555640518665314e-05, 1.8911436200141907e-05, 2.32672318816185e-05, 2.7623027563095093e-05, 3.1978823244571686e-05, 3.633461892604828e-05, 4.069041460752487e-05, 4.5046210289001465e-05, 4.940200597047806e-05, 5.375780165195465e-05, 5.8113597333431244e-05, 6.246939301490784e-05, 6.682518869638443e-05, 7.118098437786102e-05, 7.553678005933762e-05, 7.989257574081421e-05, 8.42483714222908e-05, 8.86041671037674e-05, 9.295996278524399e-05, 9.731575846672058e-05, 0.00010167155414819717, 0.00010602734982967377, 0.00011038314551115036, 0.00011473894119262695]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 0.0, 5.0, 7.0, 8.0, 6.0, 13.0, 26.0, 36.0, 40.0, 60.0, 83.0, 122.0, 238.0, 376.0, 713.0, 1484.0, 3301.0, 9294.0, 33064.0, 147851.0, 484777.0, 280052.0, 61772.0, 15888.0, 5010.0, 2058.0, 989.0, 510.0, 281.0, 160.0, 111.0, 72.0, 30.0, 30.0, 25.0, 16.0, 14.0, 3.0, 8.0, 10.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32861328125, -0.3182525634765625, -0.307891845703125, -0.2975311279296875, -0.28717041015625, -0.2768096923828125, -0.266448974609375, -0.2560882568359375, -0.2457275390625, -0.2353668212890625, -0.225006103515625, -0.2146453857421875, -0.20428466796875, -0.1939239501953125, -0.183563232421875, -0.1732025146484375, -0.162841796875, -0.1524810791015625, -0.142120361328125, -0.1317596435546875, -0.12139892578125, -0.1110382080078125, -0.100677490234375, -0.0903167724609375, -0.0799560546875, -0.0695953369140625, -0.059234619140625, -0.0488739013671875, -0.03851318359375, -0.0281524658203125, -0.017791748046875, -0.0074310302734375, 0.0029296875, 0.0132904052734375, 0.023651123046875, 0.0340118408203125, 0.04437255859375, 0.0547332763671875, 0.065093994140625, 0.0754547119140625, 0.0858154296875, 0.0961761474609375, 0.106536865234375, 0.1168975830078125, 0.12725830078125, 0.1376190185546875, 0.147979736328125, 0.1583404541015625, 0.168701171875, 0.1790618896484375, 0.189422607421875, 0.1997833251953125, 0.21014404296875, 0.2205047607421875, 0.230865478515625, 0.2412261962890625, 0.2515869140625, 0.2619476318359375, 0.272308349609375, 0.2826690673828125, 0.29302978515625, 0.3033905029296875, 0.313751220703125, 0.3241119384765625, 0.33447265625]}, "gradients/decoder.model.decoder.layers.2.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 3.0, 4.0, 1.0, 9.0, 13.0, 8.0, 13.0, 14.0, 12.0, 22.0, 28.0, 31.0, 33.0, 52.0, 48.0, 62.0, 75.0, 79.0, 91.0, 72.0, 63.0, 52.0, 47.0, 35.0, 20.0, 18.0, 13.0, 10.0, 15.0, 13.0, 7.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08123779296875, -0.07841110229492188, -0.07558441162109375, -0.07275772094726562, -0.0699310302734375, -0.06710433959960938, -0.06427764892578125, -0.061450958251953125, -0.058624267578125, -0.055797576904296875, -0.05297088623046875, -0.050144195556640625, -0.0473175048828125, -0.044490814208984375, -0.04166412353515625, -0.038837432861328125, -0.0360107421875, -0.033184051513671875, -0.03035736083984375, -0.027530670166015625, -0.0247039794921875, -0.021877288818359375, -0.01905059814453125, -0.016223907470703125, -0.013397216796875, -0.010570526123046875, -0.00774383544921875, -0.004917144775390625, -0.0020904541015625, 0.000736236572265625, 0.00356292724609375, 0.006389617919921875, 0.00921630859375, 0.012042999267578125, 0.01486968994140625, 0.017696380615234375, 0.0205230712890625, 0.023349761962890625, 0.02617645263671875, 0.029003143310546875, 0.031829833984375, 0.034656524658203125, 0.03748321533203125, 0.040309906005859375, 0.0431365966796875, 0.045963287353515625, 0.04878997802734375, 0.051616668701171875, 0.054443359375, 0.057270050048828125, 0.06009674072265625, 0.06292343139648438, 0.0657501220703125, 0.06857681274414062, 0.07140350341796875, 0.07423019409179688, 0.077056884765625, 0.07988357543945312, 0.08271026611328125, 0.08553695678710938, 0.0883636474609375, 0.09119033813476562, 0.09401702880859375, 0.09684371948242188, 0.09967041015625]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 6.0, 9.0, 8.0, 12.0, 17.0, 20.0, 45.0, 49.0, 71.0, 81.0, 73.0, 82.0, 109.0, 85.0, 83.0, 58.0, 60.0, 41.0, 33.0, 23.0, 18.0, 7.0, 6.0, 8.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.153173446655273, -16.745393753051758, -16.337615966796875, -15.92983627319336, -15.52205753326416, -15.114277839660645, -14.706499099731445, -14.29871940612793, -13.89094066619873, -13.483161926269531, -13.075382232666016, -12.667603492736816, -12.259824752807617, -11.852045059204102, -11.444266319274902, -11.036487579345703, -10.628707885742188, -10.220929145812988, -9.813149452209473, -9.405370712280273, -8.997591972351074, -8.589812278747559, -8.18203353881836, -7.774254322052002, -7.366476058959961, -6.9586968421936035, -6.550918102264404, -6.143138885498047, -5.7353596687316895, -5.327580451965332, -4.919801712036133, -4.512022495269775, -4.104243278503418, -3.6964643001556396, -3.2886850833892822, -2.880906105041504, -2.4731268882751465, -2.065347909927368, -1.6575689315795898, -1.2497897148132324, -0.8420107364654541, -0.4342316687107086, -0.026452600955963135, 0.38132643699645996, 0.7891055345535278, 1.1968846321105957, 1.604663610458374, 2.0124428272247314, 2.4202218055725098, 2.828000783920288, 3.2357800006866455, 3.643558979034424, 4.051338195800781, 4.4591169357299805, 4.866896152496338, 5.274675369262695, 5.6824541091918945, 6.090233325958252, 6.498012065887451, 6.905791282653809, 7.313570499420166, 7.721349716186523, 8.129128456115723, 8.536907196044922, 8.944686889648438]}, "gradients/decoder.model.decoder.layers.2.self_attn_layer_norm.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 4.0, 9.0, 11.0, 9.0, 17.0, 9.0, 11.0, 19.0, 25.0, 21.0, 29.0, 28.0, 39.0, 31.0, 29.0, 36.0, 30.0, 38.0, 45.0, 32.0, 39.0, 42.0, 45.0, 33.0, 35.0, 38.0, 30.0, 29.0, 26.0, 31.0, 24.0, 21.0, 18.0, 18.0, 15.0, 15.0, 14.0, 7.0, 7.0, 7.0, 5.0, 5.0, 5.0, 2.0, 2.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.507257461547852, -6.279444694519043, -6.051631927490234, -5.823818683624268, -5.596005916595459, -5.36819314956665, -5.140380382537842, -4.912567138671875, -4.684754371643066, -4.456941604614258, -4.229128837585449, -4.001315593719482, -3.773502826690674, -3.5456900596618652, -3.3178772926330566, -3.090064287185669, -2.8622515201568604, -2.6344387531280518, -2.406625747680664, -2.1788129806518555, -1.9509999752044678, -1.7231872081756592, -1.495374321937561, -1.267561435699463, -1.0397485494613647, -0.8119356632232666, -0.5841227769851685, -0.3563099503517151, -0.12849706411361694, 0.09931576251983643, 0.32712864875793457, 0.5549415349960327, 0.7827544212341309, 1.010567307472229, 1.2383801937103271, 1.4661929607391357, 1.6940059661865234, 1.921818733215332, 2.1496315002441406, 2.3774445056915283, 2.605257511138916, 2.8330702781677246, 3.0608832836151123, 3.288696050643921, 3.5165090560913086, 3.744321823120117, 3.972134590148926, 4.199947357177734, 4.427760124206543, 4.655572891235352, 4.88338565826416, 5.111198902130127, 5.3390116691589355, 5.566824436187744, 5.794637203216553, 6.0224504470825195, 6.250263214111328, 6.478075981140137, 6.705888748168945, 6.933701992034912, 7.161514759063721, 7.389327526092529, 7.617140293121338, 7.844953536987305, 8.072766304016113]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 6.0, 8.0, 6.0, 13.0, 15.0, 36.0, 48.0, 81.0, 129.0, 241.0, 547.0, 1272.0, 3557.0, 10563.0, 37338.0, 189638.0, 639197.0, 125655.0, 27324.0, 8073.0, 2775.0, 1014.0, 447.0, 225.0, 142.0, 74.0, 43.0, 29.0, 20.0, 17.0, 8.0, 7.0, 7.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.78125, -16.3323974609375, -15.883544921875, -15.4346923828125, -14.98583984375, -14.5369873046875, -14.088134765625, -13.6392822265625, -13.1904296875, -12.7415771484375, -12.292724609375, -11.8438720703125, -11.39501953125, -10.9461669921875, -10.497314453125, -10.0484619140625, -9.599609375, -9.1507568359375, -8.701904296875, -8.2530517578125, -7.80419921875, -7.3553466796875, -6.906494140625, -6.4576416015625, -6.0087890625, -5.5599365234375, -5.111083984375, -4.6622314453125, -4.21337890625, -3.7645263671875, -3.315673828125, -2.8668212890625, -2.41796875, -1.9691162109375, -1.520263671875, -1.0714111328125, -0.62255859375, -0.1737060546875, 0.275146484375, 0.7239990234375, 1.1728515625, 1.6217041015625, 2.070556640625, 2.5194091796875, 2.96826171875, 3.4171142578125, 3.865966796875, 4.3148193359375, 4.763671875, 5.2125244140625, 5.661376953125, 6.1102294921875, 6.55908203125, 7.0079345703125, 7.456787109375, 7.9056396484375, 8.3544921875, 8.8033447265625, 9.252197265625, 9.7010498046875, 10.14990234375, 10.5987548828125, 11.047607421875, 11.4964599609375, 11.9453125]}, "gradients/decoder.model.decoder.layers.2.self_attn.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 5.0, 6.0, 13.0, 10.0, 15.0, 15.0, 12.0, 24.0, 22.0, 33.0, 17.0, 29.0, 33.0, 31.0, 43.0, 35.0, 49.0, 33.0, 36.0, 61.0, 37.0, 43.0, 48.0, 30.0, 36.0, 42.0, 45.0, 19.0, 24.0, 23.0, 15.0, 21.0, 18.0, 19.0, 11.0, 11.0, 6.0, 6.0, 8.0, 3.0, 8.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.3046875, -12.8558349609375, -12.406982421875, -11.9581298828125, -11.50927734375, -11.0604248046875, -10.611572265625, -10.1627197265625, -9.7138671875, -9.2650146484375, -8.816162109375, -8.3673095703125, -7.91845703125, -7.4696044921875, -7.020751953125, -6.5718994140625, -6.123046875, -5.6741943359375, -5.225341796875, -4.7764892578125, -4.32763671875, -3.8787841796875, -3.429931640625, -2.9810791015625, -2.5322265625, -2.0833740234375, -1.634521484375, -1.1856689453125, -0.73681640625, -0.2879638671875, 0.160888671875, 0.6097412109375, 1.05859375, 1.5074462890625, 1.956298828125, 2.4051513671875, 2.85400390625, 3.3028564453125, 3.751708984375, 4.2005615234375, 4.6494140625, 5.0982666015625, 5.547119140625, 5.9959716796875, 6.44482421875, 6.8936767578125, 7.342529296875, 7.7913818359375, 8.240234375, 8.6890869140625, 9.137939453125, 9.5867919921875, 10.03564453125, 10.4844970703125, 10.933349609375, 11.3822021484375, 11.8310546875, 12.2799072265625, 12.728759765625, 13.1776123046875, 13.62646484375, 14.0753173828125, 14.524169921875, 14.9730224609375, 15.421875]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 0.0, 3.0, 5.0, 7.0, 5.0, 6.0, 8.0, 19.0, 15.0, 8.0, 24.0, 29.0, 44.0, 39.0, 62.0, 84.0, 109.0, 173.0, 269.0, 480.0, 1465.0, 8147.0, 93378.0, 862035.0, 72523.0, 7023.0, 1289.0, 494.0, 243.0, 156.0, 105.0, 69.0, 66.0, 34.0, 25.0, 27.0, 20.0, 18.0, 11.0, 3.0, 8.0, 7.0, 7.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-25.53125, -24.74462890625, -23.9580078125, -23.17138671875, -22.384765625, -21.59814453125, -20.8115234375, -20.02490234375, -19.23828125, -18.45166015625, -17.6650390625, -16.87841796875, -16.091796875, -15.30517578125, -14.5185546875, -13.73193359375, -12.9453125, -12.15869140625, -11.3720703125, -10.58544921875, -9.798828125, -9.01220703125, -8.2255859375, -7.43896484375, -6.65234375, -5.86572265625, -5.0791015625, -4.29248046875, -3.505859375, -2.71923828125, -1.9326171875, -1.14599609375, -0.359375, 0.42724609375, 1.2138671875, 2.00048828125, 2.787109375, 3.57373046875, 4.3603515625, 5.14697265625, 5.93359375, 6.72021484375, 7.5068359375, 8.29345703125, 9.080078125, 9.86669921875, 10.6533203125, 11.43994140625, 12.2265625, 13.01318359375, 13.7998046875, 14.58642578125, 15.373046875, 16.15966796875, 16.9462890625, 17.73291015625, 18.51953125, 19.30615234375, 20.0927734375, 20.87939453125, 21.666015625, 22.45263671875, 23.2392578125, 24.02587890625, 24.8125]}, "gradients/decoder.model.decoder.layers.2.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 6.0, 7.0, 6.0, 12.0, 6.0, 11.0, 18.0, 27.0, 17.0, 23.0, 22.0, 32.0, 39.0, 39.0, 40.0, 49.0, 54.0, 45.0, 48.0, 39.0, 40.0, 49.0, 37.0, 54.0, 44.0, 34.0, 36.0, 35.0, 22.0, 22.0, 19.0, 14.0, 7.0, 7.0, 6.0, 4.0, 8.0, 3.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-19.03125, -18.46923828125, -17.9072265625, -17.34521484375, -16.783203125, -16.22119140625, -15.6591796875, -15.09716796875, -14.53515625, -13.97314453125, -13.4111328125, -12.84912109375, -12.287109375, -11.72509765625, -11.1630859375, -10.60107421875, -10.0390625, -9.47705078125, -8.9150390625, -8.35302734375, -7.791015625, -7.22900390625, -6.6669921875, -6.10498046875, -5.54296875, -4.98095703125, -4.4189453125, -3.85693359375, -3.294921875, -2.73291015625, -2.1708984375, -1.60888671875, -1.046875, -0.48486328125, 0.0771484375, 0.63916015625, 1.201171875, 1.76318359375, 2.3251953125, 2.88720703125, 3.44921875, 4.01123046875, 4.5732421875, 5.13525390625, 5.697265625, 6.25927734375, 6.8212890625, 7.38330078125, 7.9453125, 8.50732421875, 9.0693359375, 9.63134765625, 10.193359375, 10.75537109375, 11.3173828125, 11.87939453125, 12.44140625, 13.00341796875, 13.5654296875, 14.12744140625, 14.689453125, 15.25146484375, 15.8134765625, 16.37548828125, 16.9375]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 5.0, 6.0, 12.0, 7.0, 20.0, 15.0, 28.0, 46.0, 99.0, 232.0, 609.0, 1561.0, 5046.0, 33155.0, 846726.0, 146587.0, 10206.0, 2553.0, 914.0, 370.0, 157.0, 68.0, 32.0, 26.0, 16.0, 14.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.5625, -9.2611083984375, -8.959716796875, -8.6583251953125, -8.35693359375, -8.0555419921875, -7.754150390625, -7.4527587890625, -7.1513671875, -6.8499755859375, -6.548583984375, -6.2471923828125, -5.94580078125, -5.6444091796875, -5.343017578125, -5.0416259765625, -4.740234375, -4.4388427734375, -4.137451171875, -3.8360595703125, -3.53466796875, -3.2332763671875, -2.931884765625, -2.6304931640625, -2.3291015625, -2.0277099609375, -1.726318359375, -1.4249267578125, -1.12353515625, -0.8221435546875, -0.520751953125, -0.2193603515625, 0.08203125, 0.3834228515625, 0.684814453125, 0.9862060546875, 1.28759765625, 1.5889892578125, 1.890380859375, 2.1917724609375, 2.4931640625, 2.7945556640625, 3.095947265625, 3.3973388671875, 3.69873046875, 4.0001220703125, 4.301513671875, 4.6029052734375, 4.904296875, 5.2056884765625, 5.507080078125, 5.8084716796875, 6.10986328125, 6.4112548828125, 6.712646484375, 7.0140380859375, 7.3154296875, 7.6168212890625, 7.918212890625, 8.2196044921875, 8.52099609375, 8.8223876953125, 9.123779296875, 9.4251708984375, 9.7265625]}, "gradients/decoder.model.decoder.layers.2.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 8.0, 16.0, 15.0, 32.0, 65.0, 108.0, 220.0, 266.0, 129.0, 50.0, 30.0, 21.0, 17.0, 8.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014066696166992188, -0.0013600140810012817, -0.0013133585453033447, -0.0012667030096054077, -0.0012200474739074707, -0.0011733919382095337, -0.0011267364025115967, -0.0010800808668136597, -0.0010334253311157227, -0.0009867697954177856, -0.0009401142597198486, -0.0008934587240219116, -0.0008468031883239746, -0.0008001476526260376, -0.0007534921169281006, -0.0007068365812301636, -0.0006601810455322266, -0.0006135255098342896, -0.0005668699741363525, -0.0005202144384384155, -0.0004735589027404785, -0.0004269033670425415, -0.0003802478313446045, -0.0003335922956466675, -0.00028693675994873047, -0.00024028122425079346, -0.00019362568855285645, -0.00014697015285491943, -0.00010031461715698242, -5.365908145904541e-05, -7.0035457611083984e-06, 3.965198993682861e-05, 8.630752563476562e-05, 0.00013296306133270264, 0.00017961859703063965, 0.00022627413272857666, 0.00027292966842651367, 0.0003195852041244507, 0.0003662407398223877, 0.0004128962755203247, 0.0004595518112182617, 0.0005062073469161987, 0.0005528628826141357, 0.0005995184183120728, 0.0006461739540100098, 0.0006928294897079468, 0.0007394850254058838, 0.0007861405611038208, 0.0008327960968017578, 0.0008794516324996948, 0.0009261071681976318, 0.0009727627038955688, 0.0010194182395935059, 0.0010660737752914429, 0.0011127293109893799, 0.001159384846687317, 0.001206040382385254, 0.001252695918083191, 0.001299351453781128, 0.001346006989479065, 0.001392662525177002, 0.001439318060874939, 0.001485973596572876, 0.001532629132270813, 0.00157928466796875]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 17.0, 26.0, 54.0, 100.0, 213.0, 453.0, 1091.0, 3444.0, 18425.0, 342147.0, 649363.0, 26684.0, 4265.0, 1271.0, 511.0, 248.0, 100.0, 56.0, 28.0, 19.0, 9.0, 6.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5234375, -9.2265625, -8.9296875, -8.6328125, -8.3359375, -8.0390625, -7.7421875, -7.4453125, -7.1484375, -6.8515625, -6.5546875, -6.2578125, -5.9609375, -5.6640625, -5.3671875, -5.0703125, -4.7734375, -4.4765625, -4.1796875, -3.8828125, -3.5859375, -3.2890625, -2.9921875, -2.6953125, -2.3984375, -2.1015625, -1.8046875, -1.5078125, -1.2109375, -0.9140625, -0.6171875, -0.3203125, -0.0234375, 0.2734375, 0.5703125, 0.8671875, 1.1640625, 1.4609375, 1.7578125, 2.0546875, 2.3515625, 2.6484375, 2.9453125, 3.2421875, 3.5390625, 3.8359375, 4.1328125, 4.4296875, 4.7265625, 5.0234375, 5.3203125, 5.6171875, 5.9140625, 6.2109375, 6.5078125, 6.8046875, 7.1015625, 7.3984375, 7.6953125, 7.9921875, 8.2890625, 8.5859375, 8.8828125, 9.1796875, 9.4765625]}, "gradients/decoder.model.decoder.layers.2.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 7.0, 12.0, 10.0, 15.0, 31.0, 39.0, 49.0, 62.0, 111.0, 211.0, 149.0, 81.0, 60.0, 37.0, 37.0, 20.0, 19.0, 13.0, 10.0, 4.0, 6.0, 3.0, 4.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.755859375, -2.676666259765625, -2.59747314453125, -2.518280029296875, -2.4390869140625, -2.359893798828125, -2.28070068359375, -2.201507568359375, -2.122314453125, -2.043121337890625, -1.96392822265625, -1.884735107421875, -1.8055419921875, -1.726348876953125, -1.64715576171875, -1.567962646484375, -1.48876953125, -1.409576416015625, -1.33038330078125, -1.251190185546875, -1.1719970703125, -1.092803955078125, -1.01361083984375, -0.934417724609375, -0.855224609375, -0.776031494140625, -0.69683837890625, -0.617645263671875, -0.5384521484375, -0.459259033203125, -0.38006591796875, -0.300872802734375, -0.2216796875, -0.142486572265625, -0.06329345703125, 0.015899658203125, 0.0950927734375, 0.174285888671875, 0.25347900390625, 0.332672119140625, 0.411865234375, 0.491058349609375, 0.57025146484375, 0.649444580078125, 0.7286376953125, 0.807830810546875, 0.88702392578125, 0.966217041015625, 1.04541015625, 1.124603271484375, 1.20379638671875, 1.282989501953125, 1.3621826171875, 1.441375732421875, 1.52056884765625, 1.599761962890625, 1.678955078125, 1.758148193359375, 1.83734130859375, 1.916534423828125, 1.9957275390625, 2.074920654296875, 2.15411376953125, 2.233306884765625, 2.3125]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 9.0, 18.0, 43.0, 105.0, 205.0, 254.0, 188.0, 124.0, 53.0, 9.0, 6.0, 2.0], "bins": [-128.43246459960938, -126.19764709472656, -123.96282958984375, -121.72801971435547, -119.49320220947266, -117.25838470458984, -115.02356719970703, -112.78875732421875, -110.55393981933594, -108.31912231445312, -106.08430480957031, -103.84949493408203, -101.61467742919922, -99.3798599243164, -97.1450424194336, -94.91023254394531, -92.6754150390625, -90.44059753417969, -88.20578002929688, -85.9709701538086, -83.73615264892578, -81.50133514404297, -79.26651763916016, -77.03170776367188, -74.79688262939453, -72.56206512451172, -70.3272476196289, -68.09243774414062, -65.85762023925781, -63.622802734375, -61.38798522949219, -59.15317153930664, -56.918357849121094, -54.68354034423828, -52.448726654052734, -50.21390914916992, -47.979095458984375, -45.74427795410156, -43.50946044921875, -41.2746467590332, -39.03982925415039, -36.80501174926758, -34.57019805908203, -32.33538055419922, -30.100566864013672, -27.86574935913086, -25.63093376159668, -23.3961181640625, -21.161304473876953, -18.926488876342773, -16.691673278808594, -14.456856727600098, -12.222041130065918, -9.987225532531738, -7.752408981323242, -5.5175933837890625, -3.2827768325805664, -1.0479609966278076, 1.1868548393249512, 3.421670913696289, 5.656486511230469, 7.891302108764648, 10.126118659973145, 12.360934257507324, 14.595749855041504]}, "gradients/decoder.model.decoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 4.0, 6.0, 5.0, 9.0, 6.0, 17.0, 11.0, 18.0, 21.0, 19.0, 21.0, 23.0, 28.0, 25.0, 33.0, 41.0, 28.0, 37.0, 32.0, 30.0, 34.0, 35.0, 50.0, 39.0, 38.0, 29.0, 43.0, 33.0, 40.0, 24.0, 24.0, 26.0, 20.0, 27.0, 15.0, 18.0, 15.0, 12.0, 18.0, 5.0, 8.0, 7.0, 5.0, 8.0, 3.0, 4.0, 0.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0], "bins": [-25.556262969970703, -24.779409408569336, -24.002553939819336, -23.22570037841797, -22.4488468170166, -21.6719913482666, -20.895137786865234, -20.118282318115234, -19.341428756713867, -18.5645751953125, -17.7877197265625, -17.010866165161133, -16.234012603759766, -15.457157135009766, -14.680303573608398, -13.903449058532715, -13.126595497131348, -12.349740982055664, -11.572887420654297, -10.796032905578613, -10.01917839050293, -9.242324829101562, -8.465470314025879, -7.688615798950195, -6.91176176071167, -6.1349077224731445, -5.358053207397461, -4.5811991691589355, -3.804344892501831, -3.0274906158447266, -2.250636577606201, -1.4737820625305176, -0.6969280242919922, 0.07992619276046753, 0.8567804098129272, 1.6336345672607422, 2.4104888439178467, 3.187343120574951, 3.9641971588134766, 4.74105167388916, 5.5179057121276855, 6.294759750366211, 7.0716142654418945, 7.84846830368042, 8.625322341918945, 9.402176856994629, 10.179031372070312, 10.95588493347168, 11.732739448547363, 12.509593963623047, 13.286447525024414, 14.063302040100098, 14.840156555175781, 15.617010116577148, 16.393863677978516, 17.170719146728516, 17.947572708129883, 18.72442626953125, 19.50128173828125, 20.278135299682617, 21.054988861083984, 21.831844329833984, 22.60869789123535, 23.38555145263672, 24.16240692138672]}, "gradients/decoder.model.decoder.layers.1.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 8.0, 10.0, 18.0, 30.0, 33.0, 43.0, 57.0, 88.0, 114.0, 211.0, 336.0, 731.0, 2284.0, 10734.0, 111886.0, 2259110.0, 1717777.0, 78695.0, 8595.0, 1888.0, 673.0, 325.0, 199.0, 124.0, 88.0, 60.0, 41.0, 32.0, 24.0, 19.0, 11.0, 5.0, 7.0, 8.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-28.234375, -27.490234375, -26.74609375, -26.001953125, -25.2578125, -24.513671875, -23.76953125, -23.025390625, -22.28125, -21.537109375, -20.79296875, -20.048828125, -19.3046875, -18.560546875, -17.81640625, -17.072265625, -16.328125, -15.583984375, -14.83984375, -14.095703125, -13.3515625, -12.607421875, -11.86328125, -11.119140625, -10.375, -9.630859375, -8.88671875, -8.142578125, -7.3984375, -6.654296875, -5.91015625, -5.166015625, -4.421875, -3.677734375, -2.93359375, -2.189453125, -1.4453125, -0.701171875, 0.04296875, 0.787109375, 1.53125, 2.275390625, 3.01953125, 3.763671875, 4.5078125, 5.251953125, 5.99609375, 6.740234375, 7.484375, 8.228515625, 8.97265625, 9.716796875, 10.4609375, 11.205078125, 11.94921875, 12.693359375, 13.4375, 14.181640625, 14.92578125, 15.669921875, 16.4140625, 17.158203125, 17.90234375, 18.646484375, 19.390625]}, "gradients/decoder.model.decoder.layers.1.fc2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 6.0, 7.0, 8.0, 13.0, 11.0, 23.0, 26.0, 28.0, 33.0, 19.0, 39.0, 39.0, 36.0, 39.0, 40.0, 50.0, 43.0, 45.0, 43.0, 52.0, 46.0, 42.0, 45.0, 37.0, 28.0, 32.0, 31.0, 28.0, 18.0, 12.0, 12.0, 20.0, 11.0, 9.0, 7.0, 4.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.78515625, -7.49298095703125, -7.2008056640625, -6.90863037109375, -6.616455078125, -6.32427978515625, -6.0321044921875, -5.73992919921875, -5.44775390625, -5.15557861328125, -4.8634033203125, -4.57122802734375, -4.279052734375, -3.98687744140625, -3.6947021484375, -3.40252685546875, -3.1103515625, -2.81817626953125, -2.5260009765625, -2.23382568359375, -1.941650390625, -1.64947509765625, -1.3572998046875, -1.06512451171875, -0.77294921875, -0.48077392578125, -0.1885986328125, 0.10357666015625, 0.395751953125, 0.68792724609375, 0.9801025390625, 1.27227783203125, 1.564453125, 1.85662841796875, 2.1488037109375, 2.44097900390625, 2.733154296875, 3.02532958984375, 3.3175048828125, 3.60968017578125, 3.90185546875, 4.19403076171875, 4.4862060546875, 4.77838134765625, 5.070556640625, 5.36273193359375, 5.6549072265625, 5.94708251953125, 6.2392578125, 6.53143310546875, 6.8236083984375, 7.11578369140625, 7.407958984375, 7.70013427734375, 7.9923095703125, 8.28448486328125, 8.57666015625, 8.86883544921875, 9.1610107421875, 9.45318603515625, 9.745361328125, 10.03753662109375, 10.3297119140625, 10.62188720703125, 10.9140625]}, "gradients/decoder.model.decoder.layers.1.fc1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 5.0, 3.0, 9.0, 8.0, 18.0, 41.0, 53.0, 116.0, 295.0, 828.0, 2371.0, 13757.0, 495506.0, 3605586.0, 67929.0, 5513.0, 1325.0, 497.0, 192.0, 91.0, 45.0, 24.0, 23.0, 15.0, 11.0, 7.0, 5.0, 4.0, 4.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.0625, -27.06982421875, -26.0771484375, -25.08447265625, -24.091796875, -23.09912109375, -22.1064453125, -21.11376953125, -20.12109375, -19.12841796875, -18.1357421875, -17.14306640625, -16.150390625, -15.15771484375, -14.1650390625, -13.17236328125, -12.1796875, -11.18701171875, -10.1943359375, -9.20166015625, -8.208984375, -7.21630859375, -6.2236328125, -5.23095703125, -4.23828125, -3.24560546875, -2.2529296875, -1.26025390625, -0.267578125, 0.72509765625, 1.7177734375, 2.71044921875, 3.703125, 4.69580078125, 5.6884765625, 6.68115234375, 7.673828125, 8.66650390625, 9.6591796875, 10.65185546875, 11.64453125, 12.63720703125, 13.6298828125, 14.62255859375, 15.615234375, 16.60791015625, 17.6005859375, 18.59326171875, 19.5859375, 20.57861328125, 21.5712890625, 22.56396484375, 23.556640625, 24.54931640625, 25.5419921875, 26.53466796875, 27.52734375, 28.52001953125, 29.5126953125, 30.50537109375, 31.498046875, 32.49072265625, 33.4833984375, 34.47607421875, 35.46875]}, "gradients/decoder.model.decoder.layers.1.fc1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 9.0, 1.0, 8.0, 18.0, 19.0, 26.0, 39.0, 66.0, 68.0, 111.0, 176.0, 280.0, 362.0, 569.0, 574.0, 510.0, 391.0, 269.0, 201.0, 118.0, 72.0, 63.0, 26.0, 29.0, 18.0, 8.0, 11.0, 4.0, 9.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.14453125, -4.986572265625, -4.82861328125, -4.670654296875, -4.5126953125, -4.354736328125, -4.19677734375, -4.038818359375, -3.880859375, -3.722900390625, -3.56494140625, -3.406982421875, -3.2490234375, -3.091064453125, -2.93310546875, -2.775146484375, -2.6171875, -2.459228515625, -2.30126953125, -2.143310546875, -1.9853515625, -1.827392578125, -1.66943359375, -1.511474609375, -1.353515625, -1.195556640625, -1.03759765625, -0.879638671875, -0.7216796875, -0.563720703125, -0.40576171875, -0.247802734375, -0.08984375, 0.068115234375, 0.22607421875, 0.384033203125, 0.5419921875, 0.699951171875, 0.85791015625, 1.015869140625, 1.173828125, 1.331787109375, 1.48974609375, 1.647705078125, 1.8056640625, 1.963623046875, 2.12158203125, 2.279541015625, 2.4375, 2.595458984375, 2.75341796875, 2.911376953125, 3.0693359375, 3.227294921875, 3.38525390625, 3.543212890625, 3.701171875, 3.859130859375, 4.01708984375, 4.175048828125, 4.3330078125, 4.490966796875, 4.64892578125, 4.806884765625, 4.96484375]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 7.0, 4.0, 7.0, 16.0, 22.0, 24.0, 30.0, 56.0, 72.0, 79.0, 89.0, 90.0, 96.0, 79.0, 80.0, 73.0, 57.0, 47.0, 28.0, 21.0, 14.0, 9.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-28.78670883178711, -28.188976287841797, -27.591243743896484, -26.993511199951172, -26.39577865600586, -25.798046112060547, -25.200313568115234, -24.602582931518555, -24.004850387573242, -23.40711784362793, -22.809385299682617, -22.211652755737305, -21.613920211791992, -21.016189575195312, -20.41845703125, -19.820724487304688, -19.222991943359375, -18.625259399414062, -18.02752685546875, -17.429794311523438, -16.832061767578125, -16.234329223632812, -15.636597633361816, -15.03886604309082, -14.441131591796875, -13.843399047851562, -13.24566650390625, -12.647933959960938, -12.050202369689941, -11.452469825744629, -10.854737281799316, -10.25700569152832, -9.659272193908691, -9.061539649963379, -8.463807106018066, -7.866075038909912, -7.268342971801758, -6.670610427856445, -6.072877883911133, -5.4751458168029785, -4.877413272857666, -4.2796807289123535, -3.681948661804199, -3.0842161178588867, -2.4864838123321533, -1.88875150680542, -1.2910189628601074, -0.6932868957519531, -0.09555435180664062, 0.5021780133247375, 1.0999103784561157, 1.6976428031921387, 2.295375108718872, 2.8931074142456055, 3.490839958190918, 4.088572025299072, 4.686304569244385, 5.284037113189697, 5.881769180297852, 6.479501724243164, 7.077234268188477, 7.674966335296631, 8.272699356079102, 8.870430946350098, 9.46816349029541]}, "gradients/decoder.model.decoder.layers.1.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 6.0, 9.0, 9.0, 11.0, 8.0, 12.0, 17.0, 11.0, 15.0, 22.0, 26.0, 23.0, 23.0, 22.0, 31.0, 27.0, 40.0, 23.0, 30.0, 28.0, 39.0, 43.0, 33.0, 39.0, 33.0, 41.0, 36.0, 30.0, 32.0, 33.0, 28.0, 23.0, 24.0, 29.0, 16.0, 20.0, 16.0, 13.0, 8.0, 12.0, 7.0, 14.0, 10.0, 4.0, 10.0, 6.0, 3.0, 3.0, 2.0, 3.0, 3.0], "bins": [-10.416826248168945, -10.121781349182129, -9.826736450195312, -9.531691551208496, -9.23664665222168, -8.941601753234863, -8.646556854248047, -8.351512908935547, -8.056467056274414, -7.761422157287598, -7.466377258300781, -7.171332359313965, -6.876287460327148, -6.581242561340332, -6.286198139190674, -5.991153240203857, -5.696108818054199, -5.401063919067383, -5.106019020080566, -4.81097412109375, -4.515929222106934, -4.220884323120117, -3.925839900970459, -3.6307950019836426, -3.335750102996826, -3.0407052040100098, -2.7456603050231934, -2.450615644454956, -2.1555707454681396, -1.8605258464813232, -1.5654810667037964, -1.2704362869262695, -0.9753904342651367, -0.6803455948829651, -0.38530075550079346, -0.09025591611862183, 0.2047889232635498, 0.4998338222503662, 0.7948786020278931, 1.08992338180542, 1.3849682807922363, 1.6800131797790527, 1.9750579595565796, 2.2701027393341064, 2.565147638320923, 2.8601925373077393, 3.1552371978759766, 3.450282096862793, 3.7453269958496094, 4.040371894836426, 4.335416793823242, 4.630461692810059, 4.925506591796875, 5.220551490783691, 5.51559591293335, 5.810640811920166, 6.105685710906982, 6.400730609893799, 6.695775508880615, 6.990820407867432, 7.28586483001709, 7.580909729003906, 7.875954627990723, 8.170999526977539, 8.466044425964355]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 5.0, 6.0, 17.0, 18.0, 26.0, 37.0, 67.0, 83.0, 113.0, 202.0, 446.0, 1077.0, 3079.0, 10510.0, 50066.0, 278778.0, 530600.0, 138272.0, 25672.0, 5949.0, 1903.0, 791.0, 349.0, 170.0, 96.0, 63.0, 54.0, 21.0, 25.0, 22.0, 20.0, 8.0, 7.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.46484375, -4.354034423828125, -4.24322509765625, -4.132415771484375, -4.0216064453125, -3.910797119140625, -3.79998779296875, -3.689178466796875, -3.578369140625, -3.467559814453125, -3.35675048828125, -3.245941162109375, -3.1351318359375, -3.024322509765625, -2.91351318359375, -2.802703857421875, -2.69189453125, -2.581085205078125, -2.47027587890625, -2.359466552734375, -2.2486572265625, -2.137847900390625, -2.02703857421875, -1.916229248046875, -1.805419921875, -1.694610595703125, -1.58380126953125, -1.472991943359375, -1.3621826171875, -1.251373291015625, -1.14056396484375, -1.029754638671875, -0.9189453125, -0.808135986328125, -0.69732666015625, -0.586517333984375, -0.4757080078125, -0.364898681640625, -0.25408935546875, -0.143280029296875, -0.032470703125, 0.078338623046875, 0.18914794921875, 0.299957275390625, 0.4107666015625, 0.521575927734375, 0.63238525390625, 0.743194580078125, 0.85400390625, 0.964813232421875, 1.07562255859375, 1.186431884765625, 1.2972412109375, 1.408050537109375, 1.51885986328125, 1.629669189453125, 1.740478515625, 1.851287841796875, 1.96209716796875, 2.072906494140625, 2.1837158203125, 2.294525146484375, 2.40533447265625, 2.516143798828125, 2.626953125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 9.0, 14.0, 17.0, 16.0, 29.0, 27.0, 26.0, 28.0, 40.0, 42.0, 61.0, 47.0, 49.0, 49.0, 45.0, 56.0, 60.0, 59.0, 53.0, 37.0, 34.0, 50.0, 22.0, 24.0, 22.0, 13.0, 12.0, 15.0, 11.0, 12.0, 12.0, 4.0, 3.0, 6.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.6953125, -10.43218994140625, -10.1690673828125, -9.90594482421875, -9.642822265625, -9.37969970703125, -9.1165771484375, -8.85345458984375, -8.59033203125, -8.32720947265625, -8.0640869140625, -7.80096435546875, -7.537841796875, -7.27471923828125, -7.0115966796875, -6.74847412109375, -6.4853515625, -6.22222900390625, -5.9591064453125, -5.69598388671875, -5.432861328125, -5.16973876953125, -4.9066162109375, -4.64349365234375, -4.38037109375, -4.11724853515625, -3.8541259765625, -3.59100341796875, -3.327880859375, -3.06475830078125, -2.8016357421875, -2.53851318359375, -2.275390625, -2.01226806640625, -1.7491455078125, -1.48602294921875, -1.222900390625, -0.95977783203125, -0.6966552734375, -0.43353271484375, -0.17041015625, 0.09271240234375, 0.3558349609375, 0.61895751953125, 0.882080078125, 1.14520263671875, 1.4083251953125, 1.67144775390625, 1.9345703125, 2.19769287109375, 2.4608154296875, 2.72393798828125, 2.987060546875, 3.25018310546875, 3.5133056640625, 3.77642822265625, 4.03955078125, 4.30267333984375, 4.5657958984375, 4.82891845703125, 5.092041015625, 5.35516357421875, 5.6182861328125, 5.88140869140625, 6.14453125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 5.0, 7.0, 11.0, 21.0, 33.0, 53.0, 85.0, 130.0, 213.0, 391.0, 585.0, 938.0, 1496.0, 2534.0, 4332.0, 7641.0, 12958.0, 22848.0, 40203.0, 69389.0, 116565.0, 172597.0, 196774.0, 156367.0, 101454.0, 59650.0, 34178.0, 19728.0, 11302.0, 6554.0, 3743.0, 2308.0, 1325.0, 786.0, 503.0, 315.0, 180.0, 114.0, 95.0, 53.0, 30.0, 33.0, 7.0, 8.0, 7.0, 1.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8046875, -0.7781906127929688, -0.7516937255859375, -0.7251968383789062, -0.698699951171875, -0.6722030639648438, -0.6457061767578125, -0.6192092895507812, -0.59271240234375, -0.5662155151367188, -0.5397186279296875, -0.5132217407226562, -0.486724853515625, -0.46022796630859375, -0.4337310791015625, -0.40723419189453125, -0.3807373046875, -0.35424041748046875, -0.3277435302734375, -0.30124664306640625, -0.274749755859375, -0.24825286865234375, -0.2217559814453125, -0.19525909423828125, -0.16876220703125, -0.14226531982421875, -0.1157684326171875, -0.08927154541015625, -0.062774658203125, -0.03627777099609375, -0.0097808837890625, 0.01671600341796875, 0.043212890625, 0.06970977783203125, 0.0962066650390625, 0.12270355224609375, 0.149200439453125, 0.17569732666015625, 0.2021942138671875, 0.22869110107421875, 0.25518798828125, 0.28168487548828125, 0.3081817626953125, 0.33467864990234375, 0.361175537109375, 0.38767242431640625, 0.4141693115234375, 0.44066619873046875, 0.4671630859375, 0.49365997314453125, 0.5201568603515625, 0.5466537475585938, 0.573150634765625, 0.5996475219726562, 0.6261444091796875, 0.6526412963867188, 0.67913818359375, 0.7056350708007812, 0.7321319580078125, 0.7586288452148438, 0.785125732421875, 0.8116226196289062, 0.8381195068359375, 0.8646163940429688, 0.89111328125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 3.0, 3.0, 2.0, 5.0, 6.0, 3.0, 15.0, 13.0, 12.0, 19.0, 17.0, 20.0, 28.0, 25.0, 30.0, 24.0, 40.0, 30.0, 52.0, 53.0, 47.0, 37.0, 45.0, 55.0, 39.0, 49.0, 34.0, 33.0, 32.0, 29.0, 27.0, 26.0, 23.0, 21.0, 22.0, 12.0, 9.0, 12.0, 7.0, 7.0, 7.0, 7.0, 6.0, 3.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-12.28125, -11.8824462890625, -11.483642578125, -11.0848388671875, -10.68603515625, -10.2872314453125, -9.888427734375, -9.4896240234375, -9.0908203125, -8.6920166015625, -8.293212890625, -7.8944091796875, -7.49560546875, -7.0968017578125, -6.697998046875, -6.2991943359375, -5.900390625, -5.5015869140625, -5.102783203125, -4.7039794921875, -4.30517578125, -3.9063720703125, -3.507568359375, -3.1087646484375, -2.7099609375, -2.3111572265625, -1.912353515625, -1.5135498046875, -1.11474609375, -0.7159423828125, -0.317138671875, 0.0816650390625, 0.48046875, 0.8792724609375, 1.278076171875, 1.6768798828125, 2.07568359375, 2.4744873046875, 2.873291015625, 3.2720947265625, 3.6708984375, 4.0697021484375, 4.468505859375, 4.8673095703125, 5.26611328125, 5.6649169921875, 6.063720703125, 6.4625244140625, 6.861328125, 7.2601318359375, 7.658935546875, 8.0577392578125, 8.45654296875, 8.8553466796875, 9.254150390625, 9.6529541015625, 10.0517578125, 10.4505615234375, 10.849365234375, 11.2481689453125, 11.64697265625, 12.0457763671875, 12.444580078125, 12.8433837890625, 13.2421875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 2.0, 6.0, 10.0, 10.0, 13.0, 21.0, 22.0, 30.0, 34.0, 53.0, 75.0, 128.0, 218.0, 515.0, 1250.0, 4083.0, 20292.0, 199480.0, 706411.0, 99329.0, 12121.0, 2695.0, 828.0, 404.0, 193.0, 84.0, 65.0, 50.0, 39.0, 25.0, 13.0, 15.0, 11.0, 9.0, 6.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5244140625, -0.50714111328125, -0.4898681640625, -0.47259521484375, -0.455322265625, -0.43804931640625, -0.4207763671875, -0.40350341796875, -0.38623046875, -0.36895751953125, -0.3516845703125, -0.33441162109375, -0.317138671875, -0.29986572265625, -0.2825927734375, -0.26531982421875, -0.248046875, -0.23077392578125, -0.2135009765625, -0.19622802734375, -0.178955078125, -0.16168212890625, -0.1444091796875, -0.12713623046875, -0.10986328125, -0.09259033203125, -0.0753173828125, -0.05804443359375, -0.040771484375, -0.02349853515625, -0.0062255859375, 0.01104736328125, 0.0283203125, 0.04559326171875, 0.0628662109375, 0.08013916015625, 0.097412109375, 0.11468505859375, 0.1319580078125, 0.14923095703125, 0.16650390625, 0.18377685546875, 0.2010498046875, 0.21832275390625, 0.235595703125, 0.25286865234375, 0.2701416015625, 0.28741455078125, 0.3046875, 0.32196044921875, 0.3392333984375, 0.35650634765625, 0.373779296875, 0.39105224609375, 0.4083251953125, 0.42559814453125, 0.44287109375, 0.46014404296875, 0.4774169921875, 0.49468994140625, 0.511962890625, 0.52923583984375, 0.5465087890625, 0.56378173828125, 0.5810546875]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 10.0, 13.0, 22.0, 42.0, 58.0, 82.0, 146.0, 157.0, 163.0, 116.0, 74.0, 44.0, 27.0, 22.0, 12.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0], "bins": [-0.00048279762268066406, -0.00047329626977443695, -0.00046379491686820984, -0.0004542935639619827, -0.0004447922110557556, -0.0004352908581495285, -0.0004257895052433014, -0.0004162881523370743, -0.00040678679943084717, -0.00039728544652462006, -0.00038778409361839294, -0.00037828274071216583, -0.0003687813878059387, -0.0003592800348997116, -0.0003497786819934845, -0.0003402773290872574, -0.0003307759761810303, -0.00032127462327480316, -0.00031177327036857605, -0.00030227191746234894, -0.0002927705645561218, -0.0002832692116498947, -0.0002737678587436676, -0.0002642665058374405, -0.0002547651529312134, -0.00024526380002498627, -0.00023576244711875916, -0.00022626109421253204, -0.00021675974130630493, -0.00020725838840007782, -0.0001977570354938507, -0.0001882556825876236, -0.00017875432968139648, -0.00016925297677516937, -0.00015975162386894226, -0.00015025027096271515, -0.00014074891805648804, -0.00013124756515026093, -0.00012174621224403381, -0.0001122448593378067, -0.00010274350643157959, -9.324215352535248e-05, -8.374080061912537e-05, -7.423944771289825e-05, -6.473809480667114e-05, -5.523674190044403e-05, -4.573538899421692e-05, -3.623403608798981e-05, -2.6732683181762695e-05, -1.7231330275535583e-05, -7.729977369308472e-06, 1.7713755369186401e-06, 1.1272728443145752e-05, 2.0774081349372864e-05, 3.0275434255599976e-05, 3.977678716182709e-05, 4.92781400680542e-05, 5.877949297428131e-05, 6.828084588050842e-05, 7.778219878673553e-05, 8.728355169296265e-05, 9.678490459918976e-05, 0.00010628625750541687, 0.00011578761041164398, 0.0001252889633178711]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 6.0, 10.0, 8.0, 19.0, 26.0, 79.0, 141.0, 326.0, 1157.0, 4995.0, 47414.0, 809575.0, 171474.0, 10513.0, 1929.0, 545.0, 179.0, 78.0, 38.0, 21.0, 15.0, 3.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0400390625, -1.0116958618164062, -0.9833526611328125, -0.9550094604492188, -0.926666259765625, -0.8983230590820312, -0.8699798583984375, -0.8416366577148438, -0.81329345703125, -0.7849502563476562, -0.7566070556640625, -0.7282638549804688, -0.699920654296875, -0.6715774536132812, -0.6432342529296875, -0.6148910522460938, -0.5865478515625, -0.5582046508789062, -0.5298614501953125, -0.5015182495117188, -0.473175048828125, -0.44483184814453125, -0.4164886474609375, -0.38814544677734375, -0.35980224609375, -0.33145904541015625, -0.3031158447265625, -0.27477264404296875, -0.246429443359375, -0.21808624267578125, -0.1897430419921875, -0.16139984130859375, -0.133056640625, -0.10471343994140625, -0.0763702392578125, -0.04802703857421875, -0.019683837890625, 0.00865936279296875, 0.0370025634765625, 0.06534576416015625, 0.09368896484375, 0.12203216552734375, 0.1503753662109375, 0.17871856689453125, 0.207061767578125, 0.23540496826171875, 0.2637481689453125, 0.29209136962890625, 0.3204345703125, 0.34877777099609375, 0.3771209716796875, 0.40546417236328125, 0.433807373046875, 0.46215057373046875, 0.4904937744140625, 0.5188369750976562, 0.54718017578125, 0.5755233764648438, 0.6038665771484375, 0.6322097778320312, 0.660552978515625, 0.6888961791992188, 0.7172393798828125, 0.7455825805664062, 0.77392578125]}, "gradients/decoder.model.decoder.layers.1.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 2.0, 7.0, 16.0, 28.0, 39.0, 64.0, 100.0, 136.0, 184.0, 155.0, 102.0, 59.0, 35.0, 23.0, 11.0, 8.0, 9.0, 2.0, 4.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12890625, -0.12317276000976562, -0.11743927001953125, -0.11170578002929688, -0.1059722900390625, -0.10023880004882812, -0.09450531005859375, -0.08877182006835938, -0.083038330078125, -0.07730484008789062, -0.07157135009765625, -0.06583786010742188, -0.0601043701171875, -0.054370880126953125, -0.04863739013671875, -0.042903900146484375, -0.03717041015625, -0.031436920166015625, -0.02570343017578125, -0.019969940185546875, -0.0142364501953125, -0.008502960205078125, -0.00276947021484375, 0.002964019775390625, 0.008697509765625, 0.014430999755859375, 0.02016448974609375, 0.025897979736328125, 0.0316314697265625, 0.037364959716796875, 0.04309844970703125, 0.048831939697265625, 0.0545654296875, 0.060298919677734375, 0.06603240966796875, 0.07176589965820312, 0.0774993896484375, 0.08323287963867188, 0.08896636962890625, 0.09469985961914062, 0.100433349609375, 0.10616683959960938, 0.11190032958984375, 0.11763381958007812, 0.1233673095703125, 0.12910079956054688, 0.13483428955078125, 0.14056777954101562, 0.14630126953125, 0.15203475952148438, 0.15776824951171875, 0.16350173950195312, 0.1692352294921875, 0.17496871948242188, 0.18070220947265625, 0.18643569946289062, 0.192169189453125, 0.19790267944335938, 0.20363616943359375, 0.20936965942382812, 0.2151031494140625, 0.22083663940429688, 0.22657012939453125, 0.23230361938476562, 0.238037109375]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 5.0, 10.0, 15.0, 20.0, 23.0, 48.0, 49.0, 58.0, 80.0, 84.0, 103.0, 94.0, 64.0, 82.0, 70.0, 52.0, 54.0, 27.0, 15.0, 24.0, 9.0, 7.0, 8.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.528404235839844, -11.200311660766602, -10.87221908569336, -10.544126510620117, -10.216033935546875, -9.887941360473633, -9.55984878540039, -9.231756210327148, -8.903663635253906, -8.575571060180664, -8.247478485107422, -7.91938591003418, -7.5912933349609375, -7.263200759887695, -6.935108184814453, -6.607015609741211, -6.2789225578308105, -5.950829982757568, -5.622737407684326, -5.294644832611084, -4.966552257537842, -4.6384596824646, -4.310366630554199, -3.982274293899536, -3.654181718826294, -3.3260891437530518, -2.9979965686798096, -2.6699037551879883, -2.341811180114746, -2.013718605041504, -1.6856260299682617, -1.3575334548950195, -1.0294408798217773, -0.7013483047485352, -0.3732556700706482, -0.04516303539276123, 0.28292953968048096, 0.6110221147537231, 0.9391148090362549, 1.267207384109497, 1.5952999591827393, 1.9233925342559814, 2.2514851093292236, 2.579577922821045, 2.907670497894287, 3.2357630729675293, 3.5638556480407715, 3.8919482231140137, 4.220040798187256, 4.548133373260498, 4.87622594833374, 5.204318523406982, 5.532411098480225, 5.860503673553467, 6.188596725463867, 6.516689300537109, 6.844781875610352, 7.172874450683594, 7.500967025756836, 7.829059600830078, 8.15715217590332, 8.485244750976562, 8.813337326049805, 9.141429901123047, 9.469522476196289]}, "gradients/decoder.model.decoder.layers.1.self_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 15.0, 9.0, 22.0, 16.0, 21.0, 27.0, 28.0, 39.0, 45.0, 43.0, 50.0, 42.0, 46.0, 59.0, 54.0, 65.0, 52.0, 56.0, 44.0, 45.0, 37.0, 42.0, 21.0, 25.0, 19.0, 13.0, 18.0, 14.0, 12.0, 7.0, 7.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.461812019348145, -10.202860832214355, -9.943910598754883, -9.684959411621094, -9.426009178161621, -9.167057991027832, -8.90810775756836, -8.64915657043457, -8.390206336975098, -8.131255149841309, -7.872304916381836, -7.613354206085205, -7.354403495788574, -7.095452785491943, -6.8365020751953125, -6.577550888061523, -6.318600177764893, -6.059649467468262, -5.800698757171631, -5.541748046875, -5.282797336578369, -5.023846626281738, -4.764895439147949, -4.505945205688477, -4.2469940185546875, -3.9880433082580566, -3.729092597961426, -3.470141887664795, -3.211191177368164, -2.952240467071533, -2.6932895183563232, -2.4343388080596924, -2.1753878593444824, -1.9164371490478516, -1.6574864387512207, -1.3985356092453003, -1.1395848989486694, -0.8806341886520386, -0.6216833591461182, -0.3627326488494873, -0.10378193855285645, 0.1551688015460968, 0.41411954164505005, 0.6730703115463257, 0.9320210218429565, 1.1909717321395874, 1.4499225616455078, 1.7088732719421387, 1.9678239822387695, 2.2267746925354004, 2.4857254028320312, 2.744676113128662, 3.003626823425293, 3.262577533721924, 3.521528482437134, 3.7804791927337646, 4.039429664611816, 4.298380374908447, 4.557331085205078, 4.816281795501709, 5.07523250579834, 5.334183216094971, 5.593133926391602, 5.852085113525391, 6.1110358238220215]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 3.0, 5.0, 10.0, 19.0, 17.0, 46.0, 65.0, 83.0, 158.0, 273.0, 448.0, 851.0, 1768.0, 4609.0, 12500.0, 35891.0, 103040.0, 290680.0, 370056.0, 148029.0, 50764.0, 17909.0, 6392.0, 2559.0, 1132.0, 542.0, 282.0, 168.0, 104.0, 45.0, 31.0, 26.0, 20.0, 10.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-11.6640625, -11.35845947265625, -11.0528564453125, -10.74725341796875, -10.441650390625, -10.13604736328125, -9.8304443359375, -9.52484130859375, -9.21923828125, -8.91363525390625, -8.6080322265625, -8.30242919921875, -7.996826171875, -7.69122314453125, -7.3856201171875, -7.08001708984375, -6.7744140625, -6.46881103515625, -6.1632080078125, -5.85760498046875, -5.552001953125, -5.24639892578125, -4.9407958984375, -4.63519287109375, -4.32958984375, -4.02398681640625, -3.7183837890625, -3.41278076171875, -3.107177734375, -2.80157470703125, -2.4959716796875, -2.19036865234375, -1.884765625, -1.57916259765625, -1.2735595703125, -0.96795654296875, -0.662353515625, -0.35675048828125, -0.0511474609375, 0.25445556640625, 0.56005859375, 0.86566162109375, 1.1712646484375, 1.47686767578125, 1.782470703125, 2.08807373046875, 2.3936767578125, 2.69927978515625, 3.0048828125, 3.31048583984375, 3.6160888671875, 3.92169189453125, 4.227294921875, 4.53289794921875, 4.8385009765625, 5.14410400390625, 5.44970703125, 5.75531005859375, 6.0609130859375, 6.36651611328125, 6.672119140625, 6.97772216796875, 7.2833251953125, 7.58892822265625, 7.89453125]}, "gradients/decoder.model.decoder.layers.1.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 5.0, 4.0, 10.0, 8.0, 9.0, 7.0, 23.0, 21.0, 29.0, 32.0, 28.0, 41.0, 51.0, 54.0, 52.0, 58.0, 52.0, 76.0, 58.0, 58.0, 50.0, 51.0, 38.0, 43.0, 25.0, 26.0, 26.0, 30.0, 11.0, 7.0, 14.0, 5.0, 7.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.640625, -20.08544921875, -19.5302734375, -18.97509765625, -18.419921875, -17.86474609375, -17.3095703125, -16.75439453125, -16.19921875, -15.64404296875, -15.0888671875, -14.53369140625, -13.978515625, -13.42333984375, -12.8681640625, -12.31298828125, -11.7578125, -11.20263671875, -10.6474609375, -10.09228515625, -9.537109375, -8.98193359375, -8.4267578125, -7.87158203125, -7.31640625, -6.76123046875, -6.2060546875, -5.65087890625, -5.095703125, -4.54052734375, -3.9853515625, -3.43017578125, -2.875, -2.31982421875, -1.7646484375, -1.20947265625, -0.654296875, -0.09912109375, 0.4560546875, 1.01123046875, 1.56640625, 2.12158203125, 2.6767578125, 3.23193359375, 3.787109375, 4.34228515625, 4.8974609375, 5.45263671875, 6.0078125, 6.56298828125, 7.1181640625, 7.67333984375, 8.228515625, 8.78369140625, 9.3388671875, 9.89404296875, 10.44921875, 11.00439453125, 11.5595703125, 12.11474609375, 12.669921875, 13.22509765625, 13.7802734375, 14.33544921875, 14.890625]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 0.0, 5.0, 1.0, 7.0, 9.0, 7.0, 11.0, 16.0, 22.0, 20.0, 27.0, 25.0, 42.0, 53.0, 82.0, 100.0, 150.0, 235.0, 382.0, 762.0, 1979.0, 7403.0, 37092.0, 203101.0, 573892.0, 180842.0, 32198.0, 6506.0, 1786.0, 731.0, 329.0, 214.0, 136.0, 102.0, 72.0, 54.0, 39.0, 19.0, 25.0, 17.0, 9.0, 14.0, 13.0, 8.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-14.5234375, -14.061767578125, -13.60009765625, -13.138427734375, -12.6767578125, -12.215087890625, -11.75341796875, -11.291748046875, -10.830078125, -10.368408203125, -9.90673828125, -9.445068359375, -8.9833984375, -8.521728515625, -8.06005859375, -7.598388671875, -7.13671875, -6.675048828125, -6.21337890625, -5.751708984375, -5.2900390625, -4.828369140625, -4.36669921875, -3.905029296875, -3.443359375, -2.981689453125, -2.52001953125, -2.058349609375, -1.5966796875, -1.135009765625, -0.67333984375, -0.211669921875, 0.25, 0.711669921875, 1.17333984375, 1.635009765625, 2.0966796875, 2.558349609375, 3.02001953125, 3.481689453125, 3.943359375, 4.405029296875, 4.86669921875, 5.328369140625, 5.7900390625, 6.251708984375, 6.71337890625, 7.175048828125, 7.63671875, 8.098388671875, 8.56005859375, 9.021728515625, 9.4833984375, 9.945068359375, 10.40673828125, 10.868408203125, 11.330078125, 11.791748046875, 12.25341796875, 12.715087890625, 13.1767578125, 13.638427734375, 14.10009765625, 14.561767578125, 15.0234375]}, "gradients/decoder.model.decoder.layers.1.self_attn.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 5.0, 2.0, 3.0, 5.0, 4.0, 3.0, 4.0, 10.0, 16.0, 8.0, 27.0, 20.0, 34.0, 34.0, 32.0, 33.0, 33.0, 41.0, 54.0, 44.0, 41.0, 54.0, 46.0, 55.0, 38.0, 58.0, 45.0, 47.0, 46.0, 27.0, 28.0, 15.0, 16.0, 18.0, 7.0, 9.0, 11.0, 7.0, 7.0, 2.0, 5.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.671875, -16.131591796875, -15.59130859375, -15.051025390625, -14.5107421875, -13.970458984375, -13.43017578125, -12.889892578125, -12.349609375, -11.809326171875, -11.26904296875, -10.728759765625, -10.1884765625, -9.648193359375, -9.10791015625, -8.567626953125, -8.02734375, -7.487060546875, -6.94677734375, -6.406494140625, -5.8662109375, -5.325927734375, -4.78564453125, -4.245361328125, -3.705078125, -3.164794921875, -2.62451171875, -2.084228515625, -1.5439453125, -1.003662109375, -0.46337890625, 0.076904296875, 0.6171875, 1.157470703125, 1.69775390625, 2.238037109375, 2.7783203125, 3.318603515625, 3.85888671875, 4.399169921875, 4.939453125, 5.479736328125, 6.02001953125, 6.560302734375, 7.1005859375, 7.640869140625, 8.18115234375, 8.721435546875, 9.26171875, 9.802001953125, 10.34228515625, 10.882568359375, 11.4228515625, 11.963134765625, 12.50341796875, 13.043701171875, 13.583984375, 14.124267578125, 14.66455078125, 15.204833984375, 15.7451171875, 16.285400390625, 16.82568359375, 17.365966796875, 17.90625]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 7.0, 7.0, 3.0, 5.0, 14.0, 18.0, 14.0, 27.0, 72.0, 166.0, 401.0, 1221.0, 5103.0, 51286.0, 739954.0, 232800.0, 13937.0, 2397.0, 663.0, 263.0, 92.0, 36.0, 31.0, 13.0, 16.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.79296875, -6.55670166015625, -6.3204345703125, -6.08416748046875, -5.847900390625, -5.61163330078125, -5.3753662109375, -5.13909912109375, -4.90283203125, -4.66656494140625, -4.4302978515625, -4.19403076171875, -3.957763671875, -3.72149658203125, -3.4852294921875, -3.24896240234375, -3.0126953125, -2.77642822265625, -2.5401611328125, -2.30389404296875, -2.067626953125, -1.83135986328125, -1.5950927734375, -1.35882568359375, -1.12255859375, -0.88629150390625, -0.6500244140625, -0.41375732421875, -0.177490234375, 0.05877685546875, 0.2950439453125, 0.53131103515625, 0.767578125, 1.00384521484375, 1.2401123046875, 1.47637939453125, 1.712646484375, 1.94891357421875, 2.1851806640625, 2.42144775390625, 2.65771484375, 2.89398193359375, 3.1302490234375, 3.36651611328125, 3.602783203125, 3.83905029296875, 4.0753173828125, 4.31158447265625, 4.5478515625, 4.78411865234375, 5.0203857421875, 5.25665283203125, 5.492919921875, 5.72918701171875, 5.9654541015625, 6.20172119140625, 6.43798828125, 6.67425537109375, 6.9105224609375, 7.14678955078125, 7.383056640625, 7.61932373046875, 7.8555908203125, 8.09185791015625, 8.328125]}, "gradients/decoder.model.decoder.layers.1.self_attn.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 2.0, 9.0, 10.0, 11.0, 24.0, 27.0, 50.0, 84.0, 113.0, 183.0, 181.0, 120.0, 74.0, 40.0, 31.0, 16.0, 9.0, 6.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013437271118164062, -0.0013029277324676514, -0.0012621283531188965, -0.0012213289737701416, -0.0011805295944213867, -0.0011397302150726318, -0.001098930835723877, -0.001058131456375122, -0.0010173320770263672, -0.0009765326976776123, -0.0009357333183288574, -0.0008949339389801025, -0.0008541345596313477, -0.0008133351802825928, -0.0007725358009338379, -0.000731736421585083, -0.0006909370422363281, -0.0006501376628875732, -0.0006093382835388184, -0.0005685389041900635, -0.0005277395248413086, -0.0004869401454925537, -0.00044614076614379883, -0.00040534138679504395, -0.00036454200744628906, -0.0003237426280975342, -0.0002829432487487793, -0.00024214386940002441, -0.00020134449005126953, -0.00016054511070251465, -0.00011974573135375977, -7.894635200500488e-05, -3.814697265625e-05, 2.652406692504883e-06, 4.3451786041259766e-05, 8.425116539001465e-05, 0.00012505054473876953, 0.00016584992408752441, 0.0002066493034362793, 0.0002474486827850342, 0.00028824806213378906, 0.00032904744148254395, 0.00036984682083129883, 0.0004106462001800537, 0.0004514455795288086, 0.0004922449588775635, 0.0005330443382263184, 0.0005738437175750732, 0.0006146430969238281, 0.000655442476272583, 0.0006962418556213379, 0.0007370412349700928, 0.0007778406143188477, 0.0008186399936676025, 0.0008594393730163574, 0.0009002387523651123, 0.0009410381317138672, 0.000981837511062622, 0.001022636890411377, 0.0010634362697601318, 0.0011042356491088867, 0.0011450350284576416, 0.0011858344078063965, 0.0012266337871551514, 0.0012674331665039062]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 5.0, 5.0, 8.0, 9.0, 21.0, 31.0, 46.0, 82.0, 146.0, 254.0, 551.0, 1039.0, 2489.0, 7313.0, 38703.0, 302873.0, 580749.0, 93855.0, 13693.0, 3760.0, 1453.0, 660.0, 344.0, 196.0, 94.0, 64.0, 41.0, 29.0, 13.0, 10.0, 9.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.63671875, -6.4583740234375, -6.280029296875, -6.1016845703125, -5.92333984375, -5.7449951171875, -5.566650390625, -5.3883056640625, -5.2099609375, -5.0316162109375, -4.853271484375, -4.6749267578125, -4.49658203125, -4.3182373046875, -4.139892578125, -3.9615478515625, -3.783203125, -3.6048583984375, -3.426513671875, -3.2481689453125, -3.06982421875, -2.8914794921875, -2.713134765625, -2.5347900390625, -2.3564453125, -2.1781005859375, -1.999755859375, -1.8214111328125, -1.64306640625, -1.4647216796875, -1.286376953125, -1.1080322265625, -0.9296875, -0.7513427734375, -0.572998046875, -0.3946533203125, -0.21630859375, -0.0379638671875, 0.140380859375, 0.3187255859375, 0.4970703125, 0.6754150390625, 0.853759765625, 1.0321044921875, 1.21044921875, 1.3887939453125, 1.567138671875, 1.7454833984375, 1.923828125, 2.1021728515625, 2.280517578125, 2.4588623046875, 2.63720703125, 2.8155517578125, 2.993896484375, 3.1722412109375, 3.3505859375, 3.5289306640625, 3.707275390625, 3.8856201171875, 4.06396484375, 4.2423095703125, 4.420654296875, 4.5989990234375, 4.77734375]}, "gradients/decoder.model.decoder.layers.1.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 2.0, 2.0, 11.0, 8.0, 14.0, 12.0, 24.0, 20.0, 35.0, 29.0, 53.0, 51.0, 74.0, 107.0, 127.0, 97.0, 75.0, 54.0, 48.0, 42.0, 29.0, 29.0, 14.0, 12.0, 7.0, 9.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84375, -1.778350830078125, -1.71295166015625, -1.647552490234375, -1.5821533203125, -1.516754150390625, -1.45135498046875, -1.385955810546875, -1.320556640625, -1.255157470703125, -1.18975830078125, -1.124359130859375, -1.0589599609375, -0.993560791015625, -0.92816162109375, -0.862762451171875, -0.79736328125, -0.731964111328125, -0.66656494140625, -0.601165771484375, -0.5357666015625, -0.470367431640625, -0.40496826171875, -0.339569091796875, -0.274169921875, -0.208770751953125, -0.14337158203125, -0.077972412109375, -0.0125732421875, 0.052825927734375, 0.11822509765625, 0.183624267578125, 0.2490234375, 0.314422607421875, 0.37982177734375, 0.445220947265625, 0.5106201171875, 0.576019287109375, 0.64141845703125, 0.706817626953125, 0.772216796875, 0.837615966796875, 0.90301513671875, 0.968414306640625, 1.0338134765625, 1.099212646484375, 1.16461181640625, 1.230010986328125, 1.29541015625, 1.360809326171875, 1.42620849609375, 1.491607666015625, 1.5570068359375, 1.622406005859375, 1.68780517578125, 1.753204345703125, 1.818603515625, 1.884002685546875, 1.94940185546875, 2.014801025390625, 2.0802001953125, 2.145599365234375, 2.21099853515625, 2.276397705078125, 2.341796875]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 18.0, 62.0, 136.0, 267.0, 219.0, 175.0, 88.0, 33.0, 10.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.592041015625, -18.567249298095703, -16.542457580566406, -14.517667770385742, -12.492876052856445, -10.468084335327148, -8.443293571472168, -6.4185028076171875, -4.393711090087891, -2.368919849395752, -0.3441286087036133, 1.6806626319885254, 3.705453872680664, 5.730245590209961, 7.755036354064941, 9.779827117919922, 11.804618835449219, 13.829410552978516, 15.854201316833496, 17.878992080688477, 19.903783798217773, 21.92857551574707, 23.953365325927734, 25.97815704345703, 28.002948760986328, 30.027740478515625, 32.05253219604492, 34.07732391357422, 36.10211181640625, 38.12690734863281, 40.151695251464844, 42.17648696899414, 44.20127868652344, 46.226070404052734, 48.25086212158203, 50.27565383911133, 52.300445556640625, 54.325233459472656, 56.35002517700195, 58.37481689453125, 60.39960861206055, 62.424400329589844, 64.44918823242188, 66.47398376464844, 68.49877166748047, 70.52356719970703, 72.54835510253906, 74.57315063476562, 76.59793853759766, 78.62272644042969, 80.64752197265625, 82.67230987548828, 84.69710540771484, 86.72189331054688, 88.74668884277344, 90.77147674560547, 92.7962646484375, 94.82105255126953, 96.8458480834961, 98.87063598632812, 100.89543151855469, 102.92021942138672, 104.94501495361328, 106.96980285644531, 108.99459838867188]}, "gradients/decoder.model.decoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 7.0, 4.0, 5.0, 11.0, 4.0, 12.0, 15.0, 9.0, 18.0, 12.0, 28.0, 15.0, 22.0, 36.0, 36.0, 32.0, 37.0, 41.0, 35.0, 45.0, 41.0, 48.0, 34.0, 37.0, 47.0, 43.0, 37.0, 29.0, 34.0, 23.0, 30.0, 22.0, 26.0, 25.0, 13.0, 14.0, 20.0, 7.0, 7.0, 9.0, 4.0, 6.0, 5.0, 1.0, 7.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.705760955810547, -21.92562484741211, -21.14548683166504, -20.3653507232666, -19.58521270751953, -18.805076599121094, -18.024938583374023, -17.244802474975586, -16.464664459228516, -15.684527397155762, -14.904390335083008, -14.124253273010254, -13.3441162109375, -12.563979148864746, -11.783842086791992, -11.003705978393555, -10.2235689163208, -9.443431854248047, -8.663294792175293, -7.883157730102539, -7.103020668029785, -6.322883605957031, -5.5427470207214355, -4.762609958648682, -3.9824728965759277, -3.202335834503174, -2.42219877243042, -1.6420619487762451, -0.8619248867034912, -0.0817878246307373, 0.6983489990234375, 1.4784860610961914, 2.2586231231689453, 3.038760185241699, 3.818897247314453, 4.599034309387207, 5.379171371459961, 6.159308433532715, 6.9394450187683105, 7.7195820808410645, 8.499719619750977, 9.27985668182373, 10.059993743896484, 10.840130805969238, 11.620267868041992, 12.400404930114746, 13.1805419921875, 13.960678100585938, 14.740815162658691, 15.520952224731445, 16.301088333129883, 17.081226348876953, 17.86136245727539, 18.64150047302246, 19.4216365814209, 20.20177459716797, 20.981910705566406, 21.762046813964844, 22.542184829711914, 23.32232093811035, 24.102458953857422, 24.88259506225586, 25.66273307800293, 26.442869186401367, 27.223007202148438]}, "gradients/decoder.model.decoder.layers.0.fc2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 10.0, 9.0, 7.0, 8.0, 13.0, 13.0, 19.0, 25.0, 26.0, 34.0, 64.0, 67.0, 111.0, 230.0, 513.0, 1606.0, 8811.0, 106056.0, 1987427.0, 1974078.0, 102622.0, 9189.0, 1970.0, 628.0, 258.0, 156.0, 92.0, 55.0, 32.0, 32.0, 21.0, 16.0, 18.0, 15.0, 13.0, 5.0, 8.0, 7.0, 5.0, 6.0, 3.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-20.34375, -19.7080078125, -19.072265625, -18.4365234375, -17.80078125, -17.1650390625, -16.529296875, -15.8935546875, -15.2578125, -14.6220703125, -13.986328125, -13.3505859375, -12.71484375, -12.0791015625, -11.443359375, -10.8076171875, -10.171875, -9.5361328125, -8.900390625, -8.2646484375, -7.62890625, -6.9931640625, -6.357421875, -5.7216796875, -5.0859375, -4.4501953125, -3.814453125, -3.1787109375, -2.54296875, -1.9072265625, -1.271484375, -0.6357421875, 0.0, 0.6357421875, 1.271484375, 1.9072265625, 2.54296875, 3.1787109375, 3.814453125, 4.4501953125, 5.0859375, 5.7216796875, 6.357421875, 6.9931640625, 7.62890625, 8.2646484375, 8.900390625, 9.5361328125, 10.171875, 10.8076171875, 11.443359375, 12.0791015625, 12.71484375, 13.3505859375, 13.986328125, 14.6220703125, 15.2578125, 15.8935546875, 16.529296875, 17.1650390625, 17.80078125, 18.4365234375, 19.072265625, 19.7080078125, 20.34375]}, "gradients/decoder.model.decoder.layers.0.fc2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 8.0, 4.0, 10.0, 10.0, 10.0, 10.0, 13.0, 21.0, 23.0, 21.0, 17.0, 35.0, 37.0, 41.0, 33.0, 55.0, 49.0, 38.0, 50.0, 53.0, 57.0, 44.0, 57.0, 35.0, 46.0, 35.0, 22.0, 32.0, 17.0, 22.0, 23.0, 14.0, 15.0, 11.0, 11.0, 6.0, 6.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.265625, -9.995849609375, -9.72607421875, -9.456298828125, -9.1865234375, -8.916748046875, -8.64697265625, -8.377197265625, -8.107421875, -7.837646484375, -7.56787109375, -7.298095703125, -7.0283203125, -6.758544921875, -6.48876953125, -6.218994140625, -5.94921875, -5.679443359375, -5.40966796875, -5.139892578125, -4.8701171875, -4.600341796875, -4.33056640625, -4.060791015625, -3.791015625, -3.521240234375, -3.25146484375, -2.981689453125, -2.7119140625, -2.442138671875, -2.17236328125, -1.902587890625, -1.6328125, -1.363037109375, -1.09326171875, -0.823486328125, -0.5537109375, -0.283935546875, -0.01416015625, 0.255615234375, 0.525390625, 0.795166015625, 1.06494140625, 1.334716796875, 1.6044921875, 1.874267578125, 2.14404296875, 2.413818359375, 2.68359375, 2.953369140625, 3.22314453125, 3.492919921875, 3.7626953125, 4.032470703125, 4.30224609375, 4.572021484375, 4.841796875, 5.111572265625, 5.38134765625, 5.651123046875, 5.9208984375, 6.190673828125, 6.46044921875, 6.730224609375, 7.0]}, "gradients/decoder.model.decoder.layers.0.fc1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 4.0, 8.0, 8.0, 20.0, 26.0, 67.0, 164.0, 471.0, 1513.0, 10745.0, 3377873.0, 796286.0, 5292.0, 1164.0, 382.0, 138.0, 68.0, 26.0, 19.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-41.90625, -40.548828125, -39.19140625, -37.833984375, -36.4765625, -35.119140625, -33.76171875, -32.404296875, -31.046875, -29.689453125, -28.33203125, -26.974609375, -25.6171875, -24.259765625, -22.90234375, -21.544921875, -20.1875, -18.830078125, -17.47265625, -16.115234375, -14.7578125, -13.400390625, -12.04296875, -10.685546875, -9.328125, -7.970703125, -6.61328125, -5.255859375, -3.8984375, -2.541015625, -1.18359375, 0.173828125, 1.53125, 2.888671875, 4.24609375, 5.603515625, 6.9609375, 8.318359375, 9.67578125, 11.033203125, 12.390625, 13.748046875, 15.10546875, 16.462890625, 17.8203125, 19.177734375, 20.53515625, 21.892578125, 23.25, 24.607421875, 25.96484375, 27.322265625, 28.6796875, 30.037109375, 31.39453125, 32.751953125, 34.109375, 35.466796875, 36.82421875, 38.181640625, 39.5390625, 40.896484375, 42.25390625, 43.611328125, 44.96875]}, "gradients/decoder.model.decoder.layers.0.fc1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 11.0, 35.0, 40.0, 102.0, 221.0, 423.0, 843.0, 967.0, 707.0, 383.0, 187.0, 74.0, 31.0, 24.0, 12.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4765625, -9.201171875, -8.92578125, -8.650390625, -8.375, -8.099609375, -7.82421875, -7.548828125, -7.2734375, -6.998046875, -6.72265625, -6.447265625, -6.171875, -5.896484375, -5.62109375, -5.345703125, -5.0703125, -4.794921875, -4.51953125, -4.244140625, -3.96875, -3.693359375, -3.41796875, -3.142578125, -2.8671875, -2.591796875, -2.31640625, -2.041015625, -1.765625, -1.490234375, -1.21484375, -0.939453125, -0.6640625, -0.388671875, -0.11328125, 0.162109375, 0.4375, 0.712890625, 0.98828125, 1.263671875, 1.5390625, 1.814453125, 2.08984375, 2.365234375, 2.640625, 2.916015625, 3.19140625, 3.466796875, 3.7421875, 4.017578125, 4.29296875, 4.568359375, 4.84375, 5.119140625, 5.39453125, 5.669921875, 5.9453125, 6.220703125, 6.49609375, 6.771484375, 7.046875, 7.322265625, 7.59765625, 7.873046875, 8.1484375]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 5.0, 0.0, 4.0, 5.0, 5.0, 5.0, 8.0, 11.0, 8.0, 15.0, 19.0, 22.0, 19.0, 22.0, 30.0, 27.0, 28.0, 41.0, 30.0, 38.0, 46.0, 45.0, 45.0, 47.0, 34.0, 39.0, 43.0, 42.0, 34.0, 27.0, 31.0, 29.0, 24.0, 26.0, 20.0, 18.0, 27.0, 19.0, 11.0, 5.0, 9.0, 10.0, 7.0, 9.0, 6.0, 1.0, 1.0, 6.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-7.737438678741455, -7.48686408996582, -7.236289978027344, -6.985715389251709, -6.735140800476074, -6.484566688537598, -6.233992099761963, -5.983417510986328, -5.732843399047852, -5.482268810272217, -5.23169469833374, -4.9811201095581055, -4.730545520782471, -4.479970932006836, -4.229396820068359, -3.9788222312927246, -3.72824764251709, -3.477673292160034, -3.2270987033843994, -2.9765243530273438, -2.725949764251709, -2.4753754138946533, -2.2248010635375977, -1.9742265939712524, -1.7236521244049072, -1.473077654838562, -1.2225031852722168, -0.9719288349151611, -0.7213543653488159, -0.4707798957824707, -0.22020554542541504, 0.030368924140930176, 0.2809438705444336, 0.5315183401107788, 0.7820927500724792, 1.0326671600341797, 1.283241629600525, 1.5338160991668701, 1.7843904495239258, 2.0349650382995605, 2.285539388656616, 2.536113739013672, 2.7866883277893066, 3.0372626781463623, 3.287837028503418, 3.5384116172790527, 3.7889859676361084, 4.039560317993164, 4.290134906768799, 4.540709495544434, 4.79128360748291, 5.041858196258545, 5.29243278503418, 5.543006896972656, 5.793581485748291, 6.044156074523926, 6.294730186462402, 6.545304775238037, 6.795878887176514, 7.046453475952148, 7.297028064727783, 7.547602653503418, 7.7981767654418945, 8.048750877380371, 8.299325942993164]}, "gradients/decoder.model.decoder.layers.0.encoder_attn_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 1.0, 6.0, 8.0, 6.0, 13.0, 8.0, 14.0, 16.0, 21.0, 15.0, 23.0, 20.0, 32.0, 18.0, 27.0, 28.0, 35.0, 39.0, 37.0, 35.0, 43.0, 34.0, 39.0, 28.0, 41.0, 47.0, 26.0, 38.0, 37.0, 26.0, 31.0, 30.0, 25.0, 34.0, 15.0, 12.0, 19.0, 17.0, 9.0, 9.0, 6.0, 4.0, 6.0, 3.0, 3.0, 7.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.115252494812012, -8.842390060424805, -8.569527626037598, -8.296666145324707, -8.0238037109375, -7.750941276550293, -7.478078842163086, -7.205216407775879, -6.93235445022583, -6.659492015838623, -6.386630058288574, -6.113767623901367, -5.84090518951416, -5.568043231964111, -5.295180797576904, -5.0223188400268555, -4.749456405639648, -4.476593971252441, -4.203732013702393, -3.9308695793151855, -3.6580073833465576, -3.3851451873779297, -3.1122827529907227, -2.8394205570220947, -2.566558361053467, -2.293696165084839, -2.020833969116211, -1.747971534729004, -1.475109338760376, -1.202247142791748, -0.9293848276138306, -0.6565225124359131, -0.38366127014160156, -0.11079901456832886, 0.16206324100494385, 0.43492549657821655, 0.7077877521514893, 0.9806499481201172, 1.2535122632980347, 1.5263745784759521, 1.79923677444458, 2.072098970413208, 2.344961166381836, 2.617823600769043, 2.890685796737671, 3.163547992706299, 3.436410427093506, 3.709272623062134, 3.9821348190307617, 4.254997253417969, 4.527859210968018, 4.800721645355225, 5.073583602905273, 5.3464460372924805, 5.6193084716796875, 5.8921709060668945, 6.165032863616943, 6.43789529800415, 6.710757255554199, 6.983619689941406, 7.256482124328613, 7.529344081878662, 7.802206516265869, 8.075068473815918, 8.347930908203125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 7.0, 4.0, 9.0, 13.0, 14.0, 23.0, 29.0, 31.0, 40.0, 48.0, 53.0, 87.0, 120.0, 139.0, 207.0, 218.0, 341.0, 569.0, 1232.0, 3884.0, 17445.0, 91359.0, 386739.0, 413903.0, 104447.0, 19758.0, 4427.0, 1336.0, 599.0, 356.0, 246.0, 199.0, 144.0, 116.0, 91.0, 49.0, 60.0, 39.0, 40.0, 29.0, 20.0, 26.0, 13.0, 7.0, 3.0, 5.0, 4.0, 11.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0], "bins": [-3.171875, -3.0728759765625, -2.973876953125, -2.8748779296875, -2.77587890625, -2.6768798828125, -2.577880859375, -2.4788818359375, -2.3798828125, -2.2808837890625, -2.181884765625, -2.0828857421875, -1.98388671875, -1.8848876953125, -1.785888671875, -1.6868896484375, -1.587890625, -1.4888916015625, -1.389892578125, -1.2908935546875, -1.19189453125, -1.0928955078125, -0.993896484375, -0.8948974609375, -0.7958984375, -0.6968994140625, -0.597900390625, -0.4989013671875, -0.39990234375, -0.3009033203125, -0.201904296875, -0.1029052734375, -0.00390625, 0.0950927734375, 0.194091796875, 0.2930908203125, 0.39208984375, 0.4910888671875, 0.590087890625, 0.6890869140625, 0.7880859375, 0.8870849609375, 0.986083984375, 1.0850830078125, 1.18408203125, 1.2830810546875, 1.382080078125, 1.4810791015625, 1.580078125, 1.6790771484375, 1.778076171875, 1.8770751953125, 1.97607421875, 2.0750732421875, 2.174072265625, 2.2730712890625, 2.3720703125, 2.4710693359375, 2.570068359375, 2.6690673828125, 2.76806640625, 2.8670654296875, 2.966064453125, 3.0650634765625, 3.1640625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.out_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 1.0, 6.0, 8.0, 11.0, 10.0, 20.0, 17.0, 17.0, 16.0, 11.0, 22.0, 29.0, 26.0, 20.0, 31.0, 31.0, 22.0, 44.0, 29.0, 31.0, 34.0, 35.0, 38.0, 34.0, 35.0, 29.0, 41.0, 28.0, 38.0, 29.0, 29.0, 21.0, 29.0, 25.0, 25.0, 15.0, 17.0, 10.0, 18.0, 13.0, 4.0, 10.0, 5.0, 5.0, 4.0, 3.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 3.0], "bins": [-5.30859375, -5.144287109375, -4.97998046875, -4.815673828125, -4.6513671875, -4.487060546875, -4.32275390625, -4.158447265625, -3.994140625, -3.829833984375, -3.66552734375, -3.501220703125, -3.3369140625, -3.172607421875, -3.00830078125, -2.843994140625, -2.6796875, -2.515380859375, -2.35107421875, -2.186767578125, -2.0224609375, -1.858154296875, -1.69384765625, -1.529541015625, -1.365234375, -1.200927734375, -1.03662109375, -0.872314453125, -0.7080078125, -0.543701171875, -0.37939453125, -0.215087890625, -0.05078125, 0.113525390625, 0.27783203125, 0.442138671875, 0.6064453125, 0.770751953125, 0.93505859375, 1.099365234375, 1.263671875, 1.427978515625, 1.59228515625, 1.756591796875, 1.9208984375, 2.085205078125, 2.24951171875, 2.413818359375, 2.578125, 2.742431640625, 2.90673828125, 3.071044921875, 3.2353515625, 3.399658203125, 3.56396484375, 3.728271484375, 3.892578125, 4.056884765625, 4.22119140625, 4.385498046875, 4.5498046875, 4.714111328125, 4.87841796875, 5.042724609375, 5.20703125]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 3.0, 11.0, 12.0, 20.0, 39.0, 36.0, 58.0, 97.0, 160.0, 258.0, 430.0, 736.0, 1286.0, 2398.0, 4379.0, 8141.0, 15599.0, 30144.0, 57765.0, 106275.0, 173146.0, 217148.0, 182793.0, 114878.0, 62960.0, 32981.0, 17043.0, 9065.0, 4815.0, 2531.0, 1394.0, 779.0, 476.0, 258.0, 161.0, 97.0, 59.0, 44.0, 27.0, 15.0, 14.0, 14.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.169921875, -1.134002685546875, -1.09808349609375, -1.062164306640625, -1.0262451171875, -0.990325927734375, -0.95440673828125, -0.918487548828125, -0.882568359375, -0.846649169921875, -0.81072998046875, -0.774810791015625, -0.7388916015625, -0.702972412109375, -0.66705322265625, -0.631134033203125, -0.59521484375, -0.559295654296875, -0.52337646484375, -0.487457275390625, -0.4515380859375, -0.415618896484375, -0.37969970703125, -0.343780517578125, -0.307861328125, -0.271942138671875, -0.23602294921875, -0.200103759765625, -0.1641845703125, -0.128265380859375, -0.09234619140625, -0.056427001953125, -0.0205078125, 0.015411376953125, 0.05133056640625, 0.087249755859375, 0.1231689453125, 0.159088134765625, 0.19500732421875, 0.230926513671875, 0.266845703125, 0.302764892578125, 0.33868408203125, 0.374603271484375, 0.4105224609375, 0.446441650390625, 0.48236083984375, 0.518280029296875, 0.55419921875, 0.590118408203125, 0.62603759765625, 0.661956787109375, 0.6978759765625, 0.733795166015625, 0.76971435546875, 0.805633544921875, 0.841552734375, 0.877471923828125, 0.91339111328125, 0.949310302734375, 0.9852294921875, 1.021148681640625, 1.05706787109375, 1.092987060546875, 1.12890625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 9.0, 4.0, 9.0, 7.0, 7.0, 11.0, 9.0, 17.0, 25.0, 23.0, 25.0, 25.0, 26.0, 34.0, 45.0, 37.0, 36.0, 38.0, 54.0, 49.0, 69.0, 46.0, 41.0, 46.0, 42.0, 41.0, 38.0, 33.0, 24.0, 21.0, 11.0, 21.0, 12.0, 11.0, 17.0, 9.0, 11.0, 2.0, 9.0, 5.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.09375, -14.554931640625, -14.01611328125, -13.477294921875, -12.9384765625, -12.399658203125, -11.86083984375, -11.322021484375, -10.783203125, -10.244384765625, -9.70556640625, -9.166748046875, -8.6279296875, -8.089111328125, -7.55029296875, -7.011474609375, -6.47265625, -5.933837890625, -5.39501953125, -4.856201171875, -4.3173828125, -3.778564453125, -3.23974609375, -2.700927734375, -2.162109375, -1.623291015625, -1.08447265625, -0.545654296875, -0.0068359375, 0.531982421875, 1.07080078125, 1.609619140625, 2.1484375, 2.687255859375, 3.22607421875, 3.764892578125, 4.3037109375, 4.842529296875, 5.38134765625, 5.920166015625, 6.458984375, 6.997802734375, 7.53662109375, 8.075439453125, 8.6142578125, 9.153076171875, 9.69189453125, 10.230712890625, 10.76953125, 11.308349609375, 11.84716796875, 12.385986328125, 12.9248046875, 13.463623046875, 14.00244140625, 14.541259765625, 15.080078125, 15.618896484375, 16.15771484375, 16.696533203125, 17.2353515625, 17.774169921875, 18.31298828125, 18.851806640625, 19.390625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 4.0, 6.0, 8.0, 10.0, 13.0, 12.0, 19.0, 24.0, 24.0, 31.0, 46.0, 45.0, 71.0, 89.0, 141.0, 218.0, 445.0, 1158.0, 3557.0, 15547.0, 148696.0, 746074.0, 114123.0, 12755.0, 3142.0, 1107.0, 411.0, 197.0, 126.0, 83.0, 80.0, 50.0, 42.0, 43.0, 34.0, 21.0, 12.0, 19.0, 17.0, 10.0, 12.0, 10.0, 4.0, 7.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.9501953125, -0.9233932495117188, -0.8965911865234375, -0.8697891235351562, -0.842987060546875, -0.8161849975585938, -0.7893829345703125, -0.7625808715820312, -0.73577880859375, -0.7089767456054688, -0.6821746826171875, -0.6553726196289062, -0.628570556640625, -0.6017684936523438, -0.5749664306640625, -0.5481643676757812, -0.5213623046875, -0.49456024169921875, -0.4677581787109375, -0.44095611572265625, -0.414154052734375, -0.38735198974609375, -0.3605499267578125, -0.33374786376953125, -0.30694580078125, -0.28014373779296875, -0.2533416748046875, -0.22653961181640625, -0.199737548828125, -0.17293548583984375, -0.1461334228515625, -0.11933135986328125, -0.092529296875, -0.06572723388671875, -0.0389251708984375, -0.01212310791015625, 0.014678955078125, 0.04148101806640625, 0.0682830810546875, 0.09508514404296875, 0.12188720703125, 0.14868927001953125, 0.1754913330078125, 0.20229339599609375, 0.229095458984375, 0.25589752197265625, 0.2826995849609375, 0.30950164794921875, 0.3363037109375, 0.36310577392578125, 0.3899078369140625, 0.41670989990234375, 0.443511962890625, 0.47031402587890625, 0.4971160888671875, 0.5239181518554688, 0.55072021484375, 0.5775222778320312, 0.6043243408203125, 0.6311264038085938, 0.657928466796875, 0.6847305297851562, 0.7115325927734375, 0.7383346557617188, 0.76513671875]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 10.0, 10.0, 11.0, 20.0, 19.0, 43.0, 48.0, 77.0, 109.0, 104.0, 106.0, 125.0, 82.0, 72.0, 62.0, 35.0, 25.0, 22.0, 8.0, 7.0, 3.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002281665802001953, -0.00021881237626075745, -0.00020945817232131958, -0.00020010396838188171, -0.00019074976444244385, -0.00018139556050300598, -0.00017204135656356812, -0.00016268715262413025, -0.00015333294868469238, -0.00014397874474525452, -0.00013462454080581665, -0.00012527033686637878, -0.00011591613292694092, -0.00010656192898750305, -9.720772504806519e-05, -8.785352110862732e-05, -7.849931716918945e-05, -6.914511322975159e-05, -5.979090929031372e-05, -5.0436705350875854e-05, -4.108250141143799e-05, -3.172829747200012e-05, -2.2374093532562256e-05, -1.301988959312439e-05, -3.6656856536865234e-06, 5.688518285751343e-06, 1.5042722225189209e-05, 2.4396926164627075e-05, 3.375113010406494e-05, 4.310533404350281e-05, 5.2459537982940674e-05, 6.181374192237854e-05, 7.11679458618164e-05, 8.052214980125427e-05, 8.987635374069214e-05, 9.923055768013e-05, 0.00010858476161956787, 0.00011793896555900574, 0.0001272931694984436, 0.00013664737343788147, 0.00014600157737731934, 0.0001553557813167572, 0.00016470998525619507, 0.00017406418919563293, 0.0001834183931350708, 0.00019277259707450867, 0.00020212680101394653, 0.0002114810049533844, 0.00022083520889282227, 0.00023018941283226013, 0.000239543616771698, 0.00024889782071113586, 0.00025825202465057373, 0.0002676062285900116, 0.00027696043252944946, 0.00028631463646888733, 0.0002956688404083252, 0.00030502304434776306, 0.00031437724828720093, 0.0003237314522266388, 0.00033308565616607666, 0.0003424398601055145, 0.0003517940640449524, 0.00036114826798439026, 0.0003705024719238281]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 5.0, 9.0, 8.0, 11.0, 21.0, 25.0, 31.0, 60.0, 101.0, 168.0, 306.0, 504.0, 868.0, 1509.0, 2560.0, 4887.0, 9650.0, 22113.0, 58371.0, 193172.0, 460391.0, 193957.0, 58043.0, 21530.0, 9564.0, 4771.0, 2448.0, 1463.0, 795.0, 482.0, 291.0, 179.0, 107.0, 47.0, 42.0, 18.0, 11.0, 15.0, 5.0, 6.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5224609375, -0.5063858032226562, -0.4903106689453125, -0.47423553466796875, -0.458160400390625, -0.44208526611328125, -0.4260101318359375, -0.40993499755859375, -0.39385986328125, -0.37778472900390625, -0.3617095947265625, -0.34563446044921875, -0.329559326171875, -0.31348419189453125, -0.2974090576171875, -0.28133392333984375, -0.2652587890625, -0.24918365478515625, -0.2331085205078125, -0.21703338623046875, -0.200958251953125, -0.18488311767578125, -0.1688079833984375, -0.15273284912109375, -0.13665771484375, -0.12058258056640625, -0.1045074462890625, -0.08843231201171875, -0.072357177734375, -0.05628204345703125, -0.0402069091796875, -0.02413177490234375, -0.008056640625, 0.00801849365234375, 0.0240936279296875, 0.04016876220703125, 0.056243896484375, 0.07231903076171875, 0.0883941650390625, 0.10446929931640625, 0.12054443359375, 0.13661956787109375, 0.1526947021484375, 0.16876983642578125, 0.184844970703125, 0.20092010498046875, 0.2169952392578125, 0.23307037353515625, 0.2491455078125, 0.26522064208984375, 0.2812957763671875, 0.29737091064453125, 0.313446044921875, 0.32952117919921875, 0.3455963134765625, 0.36167144775390625, 0.37774658203125, 0.39382171630859375, 0.4098968505859375, 0.42597198486328125, 0.442047119140625, 0.45812225341796875, 0.4741973876953125, 0.49027252197265625, 0.50634765625]}, "gradients/decoder.model.decoder.layers.0.encoder_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 3.0, 4.0, 16.0, 13.0, 13.0, 23.0, 39.0, 49.0, 92.0, 130.0, 147.0, 137.0, 101.0, 60.0, 49.0, 21.0, 24.0, 15.0, 9.0, 8.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.245361328125, -0.2378520965576172, -0.23034286499023438, -0.22283363342285156, -0.21532440185546875, -0.20781517028808594, -0.20030593872070312, -0.1927967071533203, -0.1852874755859375, -0.1777782440185547, -0.17026901245117188, -0.16275978088378906, -0.15525054931640625, -0.14774131774902344, -0.14023208618164062, -0.1327228546142578, -0.125213623046875, -0.11770439147949219, -0.11019515991210938, -0.10268592834472656, -0.09517669677734375, -0.08766746520996094, -0.08015823364257812, -0.07264900207519531, -0.0651397705078125, -0.05763053894042969, -0.050121307373046875, -0.04261207580566406, -0.03510284423828125, -0.027593612670898438, -0.020084381103515625, -0.012575149536132812, -0.00506591796875, 0.0024433135986328125, 0.009952545166015625, 0.017461776733398438, 0.02497100830078125, 0.03248023986816406, 0.039989471435546875, 0.04749870300292969, 0.0550079345703125, 0.06251716613769531, 0.07002639770507812, 0.07753562927246094, 0.08504486083984375, 0.09255409240722656, 0.10006332397460938, 0.10757255554199219, 0.115081787109375, 0.12259101867675781, 0.13010025024414062, 0.13760948181152344, 0.14511871337890625, 0.15262794494628906, 0.16013717651367188, 0.1676464080810547, 0.1751556396484375, 0.1826648712158203, 0.19017410278320312, 0.19768333435058594, 0.20519256591796875, 0.21270179748535156, 0.22021102905273438, 0.2277202606201172, 0.2352294921875]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 3.0, 6.0, 8.0, 9.0, 8.0, 15.0, 22.0, 24.0, 25.0, 30.0, 35.0, 38.0, 49.0, 47.0, 56.0, 43.0, 76.0, 66.0, 57.0, 48.0, 47.0, 40.0, 38.0, 43.0, 37.0, 15.0, 23.0, 13.0, 19.0, 14.0, 13.0, 11.0, 12.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.263401508331299, -5.063150882720947, -4.862900257110596, -4.662649631500244, -4.462399005889893, -4.262148380279541, -4.0618977546691895, -3.861647129058838, -3.6613965034484863, -3.4611458778381348, -3.260895252227783, -3.0606446266174316, -2.86039400100708, -2.6601433753967285, -2.459892749786377, -2.2596421241760254, -2.059391736984253, -1.8591411113739014, -1.6588904857635498, -1.4586398601531982, -1.2583892345428467, -1.0581387281417847, -0.8578881025314331, -0.6576374769210815, -0.45738685131073, -0.2571362257003784, -0.05688562989234924, 0.14336496591567993, 0.3436155915260315, 0.5438661575317383, 0.7441167831420898, 0.9443674087524414, 1.144618034362793, 1.3448686599731445, 1.545119285583496, 1.7453699111938477, 1.9456205368041992, 2.145871162414551, 2.3461217880249023, 2.546372413635254, 2.7466230392456055, 2.946873664855957, 3.1471242904663086, 3.34737491607666, 3.5476255416870117, 3.7478761672973633, 3.948126792907715, 4.148377418518066, 4.348628044128418, 4.5488786697387695, 4.749129295349121, 4.949379920959473, 5.149630546569824, 5.349881172180176, 5.550131797790527, 5.750382423400879, 5.950632572174072, 6.150883197784424, 6.351133823394775, 6.551384449005127, 6.7516350746154785, 6.95188570022583, 7.152136325836182, 7.352386951446533, 7.552637577056885]}, "gradients/decoder.model.decoder.layers.0.self_attn_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 2.0, 5.0, 5.0, 7.0, 9.0, 7.0, 8.0, 15.0, 14.0, 23.0, 24.0, 12.0, 25.0, 27.0, 25.0, 28.0, 35.0, 31.0, 42.0, 38.0, 39.0, 32.0, 52.0, 30.0, 31.0, 45.0, 39.0, 34.0, 29.0, 35.0, 42.0, 33.0, 27.0, 27.0, 19.0, 16.0, 20.0, 10.0, 14.0, 7.0, 11.0, 2.0, 5.0, 3.0, 7.0, 1.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.60914945602417, -5.433292865753174, -5.257436752319336, -5.08158016204834, -4.905724048614502, -4.729867458343506, -4.554011344909668, -4.378154754638672, -4.202298164367676, -4.02644157409668, -3.850585460662842, -3.6747288703918457, -3.498872756958008, -3.3230161666870117, -3.1471598148345947, -2.9713034629821777, -2.79544734954834, -2.619590997695923, -2.443734645843506, -2.2678780555725098, -2.092021942138672, -1.9161654710769653, -1.7403090000152588, -1.5644526481628418, -1.3885962963104248, -1.2127399444580078, -1.0368835926055908, -0.8610271215438843, -0.6851707696914673, -0.5093144178390503, -0.33345794677734375, -0.15760159492492676, 0.01825428009033203, 0.1941106617450714, 0.3699670433998108, 0.5458234548568726, 0.7216798067092896, 0.8975361585617065, 1.073392629623413, 1.24924898147583, 1.425105333328247, 1.600961685180664, 1.776818037033081, 1.9526745080947876, 2.128530979156494, 2.304387092590332, 2.480243682861328, 2.656100034713745, 2.831956386566162, 3.007812738418579, 3.183669090270996, 3.359525680541992, 3.53538179397583, 3.711238384246826, 3.887094736099243, 4.06295108795166, 4.238807678222656, 4.414664268493652, 4.59052038192749, 4.766376972198486, 4.942233085632324, 5.11808967590332, 5.293946266174316, 5.469802379608154, 5.645658493041992]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 7.0, 6.0, 18.0, 18.0, 22.0, 24.0, 40.0, 41.0, 67.0, 97.0, 161.0, 186.0, 316.0, 512.0, 982.0, 1854.0, 3863.0, 8508.0, 19715.0, 46467.0, 103653.0, 198394.0, 266874.0, 202730.0, 107616.0, 48493.0, 20504.0, 8821.0, 4005.0, 1931.0, 980.0, 585.0, 342.0, 218.0, 137.0, 83.0, 68.0, 56.0, 38.0, 30.0, 20.0, 19.0, 9.0, 9.0, 6.0, 3.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-8.03125, -7.7764892578125, -7.521728515625, -7.2669677734375, -7.01220703125, -6.7574462890625, -6.502685546875, -6.2479248046875, -5.9931640625, -5.7384033203125, -5.483642578125, -5.2288818359375, -4.97412109375, -4.7193603515625, -4.464599609375, -4.2098388671875, -3.955078125, -3.7003173828125, -3.445556640625, -3.1907958984375, -2.93603515625, -2.6812744140625, -2.426513671875, -2.1717529296875, -1.9169921875, -1.6622314453125, -1.407470703125, -1.1527099609375, -0.89794921875, -0.6431884765625, -0.388427734375, -0.1336669921875, 0.12109375, 0.3758544921875, 0.630615234375, 0.8853759765625, 1.14013671875, 1.3948974609375, 1.649658203125, 1.9044189453125, 2.1591796875, 2.4139404296875, 2.668701171875, 2.9234619140625, 3.17822265625, 3.4329833984375, 3.687744140625, 3.9425048828125, 4.197265625, 4.4520263671875, 4.706787109375, 4.9615478515625, 5.21630859375, 5.4710693359375, 5.725830078125, 5.9805908203125, 6.2353515625, 6.4901123046875, 6.744873046875, 6.9996337890625, 7.25439453125, 7.5091552734375, 7.763916015625, 8.0186767578125, 8.2734375]}, "gradients/decoder.model.decoder.layers.0.self_attn.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 5.0, 11.0, 4.0, 4.0, 11.0, 12.0, 13.0, 14.0, 25.0, 26.0, 32.0, 22.0, 36.0, 29.0, 36.0, 44.0, 47.0, 37.0, 45.0, 49.0, 30.0, 44.0, 38.0, 51.0, 39.0, 39.0, 30.0, 33.0, 29.0, 21.0, 19.0, 26.0, 15.0, 15.0, 11.0, 16.0, 10.0, 3.0, 3.0, 7.0, 5.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.1640625, -9.845703125, -9.52734375, -9.208984375, -8.890625, -8.572265625, -8.25390625, -7.935546875, -7.6171875, -7.298828125, -6.98046875, -6.662109375, -6.34375, -6.025390625, -5.70703125, -5.388671875, -5.0703125, -4.751953125, -4.43359375, -4.115234375, -3.796875, -3.478515625, -3.16015625, -2.841796875, -2.5234375, -2.205078125, -1.88671875, -1.568359375, -1.25, -0.931640625, -0.61328125, -0.294921875, 0.0234375, 0.341796875, 0.66015625, 0.978515625, 1.296875, 1.615234375, 1.93359375, 2.251953125, 2.5703125, 2.888671875, 3.20703125, 3.525390625, 3.84375, 4.162109375, 4.48046875, 4.798828125, 5.1171875, 5.435546875, 5.75390625, 6.072265625, 6.390625, 6.708984375, 7.02734375, 7.345703125, 7.6640625, 7.982421875, 8.30078125, 8.619140625, 8.9375, 9.255859375, 9.57421875, 9.892578125, 10.2109375]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 6.0, 8.0, 19.0, 20.0, 24.0, 26.0, 48.0, 47.0, 83.0, 128.0, 229.0, 291.0, 621.0, 1157.0, 3142.0, 9748.0, 37649.0, 152973.0, 416517.0, 307544.0, 87256.0, 20917.0, 5848.0, 2129.0, 888.0, 446.0, 267.0, 154.0, 105.0, 80.0, 46.0, 31.0, 27.0, 24.0, 10.0, 8.0, 10.0, 4.0, 9.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.8203125, -14.3228759765625, -13.825439453125, -13.3280029296875, -12.83056640625, -12.3331298828125, -11.835693359375, -11.3382568359375, -10.8408203125, -10.3433837890625, -9.845947265625, -9.3485107421875, -8.85107421875, -8.3536376953125, -7.856201171875, -7.3587646484375, -6.861328125, -6.3638916015625, -5.866455078125, -5.3690185546875, -4.87158203125, -4.3741455078125, -3.876708984375, -3.3792724609375, -2.8818359375, -2.3843994140625, -1.886962890625, -1.3895263671875, -0.89208984375, -0.3946533203125, 0.102783203125, 0.6002197265625, 1.09765625, 1.5950927734375, 2.092529296875, 2.5899658203125, 3.08740234375, 3.5848388671875, 4.082275390625, 4.5797119140625, 5.0771484375, 5.5745849609375, 6.072021484375, 6.5694580078125, 7.06689453125, 7.5643310546875, 8.061767578125, 8.5592041015625, 9.056640625, 9.5540771484375, 10.051513671875, 10.5489501953125, 11.04638671875, 11.5438232421875, 12.041259765625, 12.5386962890625, 13.0361328125, 13.5335693359375, 14.031005859375, 14.5284423828125, 15.02587890625, 15.5233154296875, 16.020751953125, 16.5181884765625, 17.015625]}, "gradients/decoder.model.decoder.layers.0.self_attn.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 4.0, 5.0, 4.0, 7.0, 11.0, 15.0, 19.0, 14.0, 13.0, 20.0, 23.0, 25.0, 24.0, 35.0, 51.0, 43.0, 49.0, 41.0, 52.0, 66.0, 59.0, 50.0, 37.0, 54.0, 41.0, 33.0, 29.0, 33.0, 19.0, 12.0, 17.0, 19.0, 11.0, 14.0, 13.0, 8.0, 8.0, 4.0, 7.0, 5.0, 4.0, 3.0, 0.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.390625, -11.969970703125, -11.54931640625, -11.128662109375, -10.7080078125, -10.287353515625, -9.86669921875, -9.446044921875, -9.025390625, -8.604736328125, -8.18408203125, -7.763427734375, -7.3427734375, -6.922119140625, -6.50146484375, -6.080810546875, -5.66015625, -5.239501953125, -4.81884765625, -4.398193359375, -3.9775390625, -3.556884765625, -3.13623046875, -2.715576171875, -2.294921875, -1.874267578125, -1.45361328125, -1.032958984375, -0.6123046875, -0.191650390625, 0.22900390625, 0.649658203125, 1.0703125, 1.490966796875, 1.91162109375, 2.332275390625, 2.7529296875, 3.173583984375, 3.59423828125, 4.014892578125, 4.435546875, 4.856201171875, 5.27685546875, 5.697509765625, 6.1181640625, 6.538818359375, 6.95947265625, 7.380126953125, 7.80078125, 8.221435546875, 8.64208984375, 9.062744140625, 9.4833984375, 9.904052734375, 10.32470703125, 10.745361328125, 11.166015625, 11.586669921875, 12.00732421875, 12.427978515625, 12.8486328125, 13.269287109375, 13.68994140625, 14.110595703125, 14.53125]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 6.0, 7.0, 9.0, 5.0, 20.0, 28.0, 38.0, 85.0, 139.0, 297.0, 573.0, 1190.0, 2793.0, 7001.0, 19526.0, 59501.0, 166851.0, 377770.0, 252193.0, 105786.0, 35048.0, 11738.0, 4393.0, 1863.0, 821.0, 400.0, 199.0, 107.0, 77.0, 27.0, 26.0, 16.0, 9.0, 3.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.763671875, -2.684173583984375, -2.60467529296875, -2.525177001953125, -2.4456787109375, -2.366180419921875, -2.28668212890625, -2.207183837890625, -2.127685546875, -2.048187255859375, -1.96868896484375, -1.889190673828125, -1.8096923828125, -1.730194091796875, -1.65069580078125, -1.571197509765625, -1.49169921875, -1.412200927734375, -1.33270263671875, -1.253204345703125, -1.1737060546875, -1.094207763671875, -1.01470947265625, -0.935211181640625, -0.855712890625, -0.776214599609375, -0.69671630859375, -0.617218017578125, -0.5377197265625, -0.458221435546875, -0.37872314453125, -0.299224853515625, -0.2197265625, -0.140228271484375, -0.06072998046875, 0.018768310546875, 0.0982666015625, 0.177764892578125, 0.25726318359375, 0.336761474609375, 0.416259765625, 0.495758056640625, 0.57525634765625, 0.654754638671875, 0.7342529296875, 0.813751220703125, 0.89324951171875, 0.972747802734375, 1.05224609375, 1.131744384765625, 1.21124267578125, 1.290740966796875, 1.3702392578125, 1.449737548828125, 1.52923583984375, 1.608734130859375, 1.688232421875, 1.767730712890625, 1.84722900390625, 1.926727294921875, 2.0062255859375, 2.085723876953125, 2.16522216796875, 2.244720458984375, 2.32421875]}, "gradients/decoder.model.decoder.layers.0.self_attn.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 2.0, 6.0, 10.0, 12.0, 12.0, 16.0, 22.0, 31.0, 35.0, 46.0, 43.0, 73.0, 84.0, 82.0, 141.0, 71.0, 56.0, 56.0, 42.0, 34.0, 36.0, 32.0, 15.0, 7.0, 9.0, 4.0, 11.0, 7.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005140304565429688, -0.0004953071475028992, -0.0004765838384628296, -0.00045786052942276, -0.00043913722038269043, -0.00042041391134262085, -0.00040169060230255127, -0.0003829672932624817, -0.0003642439842224121, -0.00034552067518234253, -0.00032679736614227295, -0.00030807405710220337, -0.0002893507480621338, -0.0002706274390220642, -0.00025190412998199463, -0.00023318082094192505, -0.00021445751190185547, -0.0001957342028617859, -0.0001770108938217163, -0.00015828758478164673, -0.00013956427574157715, -0.00012084096670150757, -0.00010211765766143799, -8.339434862136841e-05, -6.467103958129883e-05, -4.594773054122925e-05, -2.7224421501159668e-05, -8.501112461090088e-06, 1.0222196578979492e-05, 2.8945505619049072e-05, 4.766881465911865e-05, 6.639212369918823e-05, 8.511543273925781e-05, 0.00010383874177932739, 0.00012256205081939697, 0.00014128535985946655, 0.00016000866889953613, 0.0001787319779396057, 0.0001974552869796753, 0.00021617859601974487, 0.00023490190505981445, 0.00025362521409988403, 0.0002723485231399536, 0.0002910718321800232, 0.0003097951412200928, 0.00032851845026016235, 0.00034724175930023193, 0.0003659650683403015, 0.0003846883773803711, 0.0004034116864204407, 0.00042213499546051025, 0.00044085830450057983, 0.0004595816135406494, 0.000478304922580719, 0.0004970282316207886, 0.0005157515406608582, 0.0005344748497009277, 0.0005531981587409973, 0.0005719214677810669, 0.0005906447768211365, 0.0006093680858612061, 0.0006280913949012756, 0.0006468147039413452, 0.0006655380129814148, 0.0006842613220214844]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 6.0, 8.0, 7.0, 12.0, 21.0, 24.0, 41.0, 53.0, 56.0, 93.0, 110.0, 157.0, 200.0, 325.0, 437.0, 642.0, 950.0, 1533.0, 2693.0, 4632.0, 8854.0, 18532.0, 42275.0, 100806.0, 211074.0, 334659.0, 175592.0, 78995.0, 33404.0, 14829.0, 7294.0, 3735.0, 2278.0, 1366.0, 875.0, 563.0, 426.0, 283.0, 214.0, 125.0, 108.0, 71.0, 74.0, 26.0, 29.0, 24.0, 14.0, 11.0, 6.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0], "bins": [-2.6171875, -2.538726806640625, -2.46026611328125, -2.381805419921875, -2.3033447265625, -2.224884033203125, -2.14642333984375, -2.067962646484375, -1.989501953125, -1.911041259765625, -1.83258056640625, -1.754119873046875, -1.6756591796875, -1.597198486328125, -1.51873779296875, -1.440277099609375, -1.36181640625, -1.283355712890625, -1.20489501953125, -1.126434326171875, -1.0479736328125, -0.969512939453125, -0.89105224609375, -0.812591552734375, -0.734130859375, -0.655670166015625, -0.57720947265625, -0.498748779296875, -0.4202880859375, -0.341827392578125, -0.26336669921875, -0.184906005859375, -0.1064453125, -0.027984619140625, 0.05047607421875, 0.128936767578125, 0.2073974609375, 0.285858154296875, 0.36431884765625, 0.442779541015625, 0.521240234375, 0.599700927734375, 0.67816162109375, 0.756622314453125, 0.8350830078125, 0.913543701171875, 0.99200439453125, 1.070465087890625, 1.14892578125, 1.227386474609375, 1.30584716796875, 1.384307861328125, 1.4627685546875, 1.541229248046875, 1.61968994140625, 1.698150634765625, 1.776611328125, 1.855072021484375, 1.93353271484375, 2.011993408203125, 2.0904541015625, 2.168914794921875, 2.24737548828125, 2.325836181640625, 2.404296875]}, "gradients/decoder.model.decoder.layers.0.self_attn.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 3.0, 12.0, 15.0, 19.0, 21.0, 27.0, 37.0, 54.0, 56.0, 66.0, 75.0, 108.0, 119.0, 57.0, 79.0, 60.0, 44.0, 30.0, 30.0, 18.0, 22.0, 14.0, 9.0, 7.0, 3.0, 3.0, 0.0, 3.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.54296875, -2.4760589599609375, -2.409149169921875, -2.3422393798828125, -2.27532958984375, -2.2084197998046875, -2.141510009765625, -2.0746002197265625, -2.0076904296875, -1.9407806396484375, -1.873870849609375, -1.8069610595703125, -1.74005126953125, -1.6731414794921875, -1.606231689453125, -1.5393218994140625, -1.472412109375, -1.4055023193359375, -1.338592529296875, -1.2716827392578125, -1.20477294921875, -1.1378631591796875, -1.070953369140625, -1.0040435791015625, -0.9371337890625, -0.8702239990234375, -0.803314208984375, -0.7364044189453125, -0.66949462890625, -0.6025848388671875, -0.535675048828125, -0.4687652587890625, -0.40185546875, -0.3349456787109375, -0.268035888671875, -0.2011260986328125, -0.13421630859375, -0.0673065185546875, -0.000396728515625, 0.0665130615234375, 0.1334228515625, 0.2003326416015625, 0.267242431640625, 0.3341522216796875, 0.40106201171875, 0.4679718017578125, 0.534881591796875, 0.6017913818359375, 0.668701171875, 0.7356109619140625, 0.802520751953125, 0.8694305419921875, 0.93634033203125, 1.0032501220703125, 1.070159912109375, 1.1370697021484375, 1.2039794921875, 1.2708892822265625, 1.337799072265625, 1.4047088623046875, 1.47161865234375, 1.5385284423828125, 1.605438232421875, 1.6723480224609375, 1.7392578125]}, "gradients/decoder.model.decoder.layernorm_embedding.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 4.0, 5.0, 13.0, 28.0, 63.0, 77.0, 100.0, 138.0, 147.0, 140.0, 105.0, 68.0, 49.0, 34.0, 19.0, 7.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.04603576660156, -43.05390930175781, -42.0617790222168, -41.06965255737305, -40.07752227783203, -39.08539581298828, -38.09326934814453, -37.101139068603516, -36.109012603759766, -35.116886138916016, -34.124755859375, -33.13262939453125, -32.1405029296875, -31.148372650146484, -30.156246185302734, -29.16411781311035, -28.17198944091797, -27.179861068725586, -26.187732696533203, -25.195606231689453, -24.20347785949707, -23.211349487304688, -22.219223022460938, -21.227094650268555, -20.234966278076172, -19.24283790588379, -18.250709533691406, -17.258583068847656, -16.266454696655273, -15.27432632446289, -14.282198905944824, -13.290071487426758, -12.297943115234375, -11.305814743041992, -10.313687324523926, -9.32155990600586, -8.329431533813477, -7.337303638458252, -6.345175743103027, -5.353047847747803, -4.360919952392578, -3.3687920570373535, -2.376664161682129, -1.3845362663269043, -0.3924083709716797, 0.5997195243835449, 1.5918474197387695, 2.583975315093994, 3.5761032104492188, 4.568231105804443, 5.560359001159668, 6.552486896514893, 7.544614791870117, 8.5367431640625, 9.528870582580566, 10.520998001098633, 11.513126373291016, 12.505254745483398, 13.497382164001465, 14.489509582519531, 15.481637954711914, 16.473766326904297, 17.465892791748047, 18.45802116394043, 19.450149536132812]}, "gradients/decoder.model.decoder.layernorm_embedding.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 2.0, 3.0, 5.0, 8.0, 8.0, 6.0, 13.0, 14.0, 13.0, 35.0, 22.0, 33.0, 29.0, 43.0, 30.0, 43.0, 61.0, 62.0, 64.0, 61.0, 43.0, 48.0, 54.0, 31.0, 37.0, 42.0, 28.0, 28.0, 18.0, 21.0, 14.0, 14.0, 11.0, 12.0, 9.0, 10.0, 12.0, 7.0, 6.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.78342628479004, -24.045886993408203, -23.308347702026367, -22.57080841064453, -21.833271026611328, -21.095731735229492, -20.358192443847656, -19.62065315246582, -18.883113861083984, -18.14557456970215, -17.408035278320312, -16.670495986938477, -15.932957649230957, -15.195418357849121, -14.457880020141602, -13.720340728759766, -12.98280143737793, -12.245262145996094, -11.507722854614258, -10.770184516906738, -10.032645225524902, -9.295105934143066, -8.557567596435547, -7.820028305053711, -7.082489013671875, -6.344949722290039, -5.607410907745361, -4.869872093200684, -4.132332801818848, -3.394793748855591, -2.657254695892334, -1.9197158813476562, -1.1821784973144531, -0.4446394443511963, 0.29289960861206055, 1.0304386615753174, 1.7679777145385742, 2.505516767501831, 3.243055820465088, 3.9805946350097656, 4.718133926391602, 5.4556732177734375, 6.193212032318115, 6.930750846862793, 7.668290138244629, 8.405829429626465, 9.143367767333984, 9.88090705871582, 10.618446350097656, 11.355985641479492, 12.093524932861328, 12.831063270568848, 13.568602561950684, 14.30614185333252, 15.043680191040039, 15.781219482421875, 16.51875877380371, 17.256298065185547, 17.993837356567383, 18.73137664794922, 19.468914031982422, 20.206453323364258, 20.943992614746094, 21.68153190612793, 22.419071197509766]}, "gradients/decoder.model.decoder.embed_positions.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 16.0, 7.0, 6.0, 14.0, 14.0, 34.0, 43.0, 64.0, 94.0, 120.0, 180.0, 285.0, 467.0, 722.0, 1086.0, 1549.0, 2341.0, 3404.0, 4911.0, 7582.0, 998325.0, 10302.0, 6187.0, 4219.0, 2844.0, 1950.0, 1279.0, 856.0, 534.0, 398.0, 227.0, 178.0, 119.0, 78.0, 51.0, 33.0, 24.0, 21.0, 14.0, 10.0, 10.0, 3.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.195330619812012, -14.717035293579102, -14.238740921020508, -13.760445594787598, -13.282150268554688, -12.803855895996094, -12.325560569763184, -11.847265243530273, -11.36897087097168, -10.89067554473877, -10.412381172180176, -9.934085845947266, -9.455791473388672, -8.977496147155762, -8.499200820922852, -8.020906448364258, -7.542611122131348, -7.064316272735596, -6.586021423339844, -6.107726097106934, -5.629431247711182, -5.15113639831543, -4.6728410720825195, -4.194546222686768, -3.7162513732910156, -3.2379565238952637, -2.7596614360809326, -2.2813663482666016, -1.8030714988708496, -1.3247766494750977, -0.8464815616607666, -0.36818647384643555, 0.110107421875, 0.5884023904800415, 1.066697359085083, 1.5449923276901245, 2.023287296295166, 2.501582145690918, 2.979877233505249, 3.45817232131958, 3.936467170715332, 4.414762020111084, 4.893056869506836, 5.371352195739746, 5.849647045135498, 6.32794189453125, 6.80623722076416, 7.284532070159912, 7.762826919555664, 8.241122245788574, 8.719416618347168, 9.197711944580078, 9.676006317138672, 10.154301643371582, 10.632596969604492, 11.110891342163086, 11.589186668395996, 12.067481994628906, 12.5457763671875, 13.02407169342041, 13.50236701965332, 13.980661392211914, 14.458956718444824, 14.937252044677734, 15.415546417236328]}, "gradients/decoder.model.decoder.embed_tokens.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 6.0, 6.0, 5.0, 20.0, 34.0, 117.0, 282.0, 760.0, 3637.0, 548646.0, 50911616.0, 4129.0, 758.0, 291.0, 115.0, 46.0, 27.0, 9.0, 10.0, 9.0, 3.0, 1.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-155.36744689941406, -149.61473083496094, -143.8620147705078, -138.1092987060547, -132.35658264160156, -126.60386657714844, -120.85115051269531, -115.09843444824219, -109.34571838378906, -103.59300231933594, -97.84028625488281, -92.08757019042969, -86.33485412597656, -80.58213806152344, -74.82942199707031, -69.07670593261719, -63.323997497558594, -57.57128143310547, -51.818565368652344, -46.06584930419922, -40.313133239746094, -34.56041717529297, -28.80770492553711, -23.054988861083984, -17.30227279663086, -11.549556732177734, -5.796841621398926, -0.04412651062011719, 5.708589553833008, 11.461305618286133, 17.214019775390625, 22.96673583984375, 28.719451904296875, 34.47216796875, 40.224884033203125, 45.97760009765625, 51.730316162109375, 57.4830322265625, 63.23574447631836, 68.98846435546875, 74.74118041992188, 80.493896484375, 86.24661254882812, 91.99932861328125, 97.75204467773438, 103.5047607421875, 109.25747680664062, 115.01019287109375, 120.76290130615234, 126.51561737060547, 132.26832580566406, 138.0210418701172, 143.7737579345703, 149.52647399902344, 155.27919006347656, 161.0319061279297, 166.7846221923828, 172.53733825683594, 178.29005432128906, 184.0427703857422, 189.7954864501953, 195.54820251464844, 201.30091857910156, 207.0536346435547, 212.8063507080078]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 6.0, 5.0, 12.0, 18.0, 24.0, 53.0, 58.0, 107.0, 162.0, 227.0, 346.0, 490.0, 743.0, 1130.0, 1494.0, 2218.0, 3401.0, 4958.0, 7691.0, 11600.0, 18091.0, 27938.0, 43585.0, 66736.0, 103008.0, 155127.0, 225872.0, 305215.0, 384129.0, 3523084.0, 395064.0, 312137.0, 231372.0, 160584.0, 106818.0, 68833.0, 45225.0, 28852.0, 18967.0, 12114.0, 7819.0, 5243.0, 3561.0, 2374.0, 1576.0, 1136.0, 752.0, 523.0, 348.0, 200.0, 153.0, 98.0, 61.0, 30.0, 31.0, 23.0, 10.0, 4.0, 7.0, 4.0, 4.0], "bins": [-5.1171875, -4.9599609375, -4.802734375, -4.6455078125, -4.48828125, -4.3310546875, -4.173828125, -4.0166015625, -3.859375, -3.7021484375, -3.544921875, -3.3876953125, -3.23046875, -3.0732421875, -2.916015625, -2.7587890625, -2.6015625, -2.4443359375, -2.287109375, -2.1298828125, -1.97265625, -1.8154296875, -1.658203125, -1.5009765625, -1.34375, -1.1865234375, -1.029296875, -0.8720703125, -0.71484375, -0.5576171875, -0.400390625, -0.2431640625, -0.0859375, 0.0712890625, 0.228515625, 0.3857421875, 0.54296875, 0.7001953125, 0.857421875, 1.0146484375, 1.171875, 1.3291015625, 1.486328125, 1.6435546875, 1.80078125, 1.9580078125, 2.115234375, 2.2724609375, 2.4296875, 2.5869140625, 2.744140625, 2.9013671875, 3.05859375, 3.2158203125, 3.373046875, 3.5302734375, 3.6875, 3.8447265625, 4.001953125, 4.1591796875, 4.31640625, 4.4736328125, 4.630859375, 4.7880859375, 4.9453125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 8.0, 7.0, 7.0, 13.0, 7.0, 12.0, 22.0, 15.0, 29.0, 18.0, 24.0, 34.0, 33.0, 32.0, 39.0, 43.0, 48.0, 51.0, 1040.0, 84.0, 46.0, 45.0, 51.0, 30.0, 49.0, 28.0, 28.0, 37.0, 24.0, 14.0, 17.0, 20.0, 13.0, 12.0, 6.0, 5.0, 0.0, 8.0, 4.0, 7.0, 1.0, 0.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-119.5625, -115.78515625, -112.0078125, -108.23046875, -104.453125, -100.67578125, -96.8984375, -93.12109375, -89.34375, -85.56640625, -81.7890625, -78.01171875, -74.234375, -70.45703125, -66.6796875, -62.90234375, -59.125, -55.34765625, -51.5703125, -47.79296875, -44.015625, -40.23828125, -36.4609375, -32.68359375, -28.90625, -25.12890625, -21.3515625, -17.57421875, -13.796875, -10.01953125, -6.2421875, -2.46484375, 1.3125, 5.08984375, 8.8671875, 12.64453125, 16.421875, 20.19921875, 23.9765625, 27.75390625, 31.53125, 35.30859375, 39.0859375, 42.86328125, 46.640625, 50.41796875, 54.1953125, 57.97265625, 61.75, 65.52734375, 69.3046875, 73.08203125, 76.859375, 80.63671875, 84.4140625, 88.19140625, 91.96875, 95.74609375, 99.5234375, 103.30078125, 107.078125, 110.85546875, 114.6328125, 118.41015625, 122.1875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 8.0, 1.0, 7.0, 8.0, 17.0, 31.0, 44.0, 68.0, 83.0, 123.0, 155.0, 302.0, 409.0, 687.0, 1063.0, 1722.0, 2731.0, 4342.0, 7298.0, 12055.0, 20489.0, 35050.0, 60011.0, 102101.0, 170606.0, 265826.0, 376977.0, 977179.0, 3099922.0, 398512.0, 289631.0, 187021.0, 113852.0, 66828.0, 38888.0, 22898.0, 13700.0, 8045.0, 4937.0, 2987.0, 1815.0, 1135.0, 659.0, 437.0, 277.0, 161.0, 113.0, 85.0, 77.0, 26.0, 24.0, 11.0, 5.0, 3.0, 1.0, 1.0, 2.0], "bins": [-6.2109375, -6.03399658203125, -5.8570556640625, -5.68011474609375, -5.503173828125, -5.32623291015625, -5.1492919921875, -4.97235107421875, -4.79541015625, -4.61846923828125, -4.4415283203125, -4.26458740234375, -4.087646484375, -3.91070556640625, -3.7337646484375, -3.55682373046875, -3.3798828125, -3.20294189453125, -3.0260009765625, -2.84906005859375, -2.672119140625, -2.49517822265625, -2.3182373046875, -2.14129638671875, -1.96435546875, -1.78741455078125, -1.6104736328125, -1.43353271484375, -1.256591796875, -1.07965087890625, -0.9027099609375, -0.72576904296875, -0.548828125, -0.37188720703125, -0.1949462890625, -0.01800537109375, 0.158935546875, 0.33587646484375, 0.5128173828125, 0.68975830078125, 0.86669921875, 1.04364013671875, 1.2205810546875, 1.39752197265625, 1.574462890625, 1.75140380859375, 1.9283447265625, 2.10528564453125, 2.2822265625, 2.45916748046875, 2.6361083984375, 2.81304931640625, 2.989990234375, 3.16693115234375, 3.3438720703125, 3.52081298828125, 3.69775390625, 3.87469482421875, 4.0516357421875, 4.22857666015625, 4.405517578125, 4.58245849609375, 4.7593994140625, 4.93634033203125, 5.11328125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 9.0, 5.0, 4.0, 9.0, 7.0, 9.0, 8.0, 11.0, 18.0, 29.0, 14.0, 24.0, 29.0, 26.0, 38.0, 31.0, 32.0, 49.0, 39.0, 39.0, 46.0, 1029.0, 85.0, 46.0, 34.0, 43.0, 31.0, 35.0, 35.0, 36.0, 24.0, 31.0, 12.0, 21.0, 19.0, 13.0, 12.0, 16.0, 9.0, 7.0, 4.0, 2.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-108.75, -105.7021484375, -102.654296875, -99.6064453125, -96.55859375, -93.5107421875, -90.462890625, -87.4150390625, -84.3671875, -81.3193359375, -78.271484375, -75.2236328125, -72.17578125, -69.1279296875, -66.080078125, -63.0322265625, -59.984375, -56.9365234375, -53.888671875, -50.8408203125, -47.79296875, -44.7451171875, -41.697265625, -38.6494140625, -35.6015625, -32.5537109375, -29.505859375, -26.4580078125, -23.41015625, -20.3623046875, -17.314453125, -14.2666015625, -11.21875, -8.1708984375, -5.123046875, -2.0751953125, 0.97265625, 4.0205078125, 7.068359375, 10.1162109375, 13.1640625, 16.2119140625, 19.259765625, 22.3076171875, 25.35546875, 28.4033203125, 31.451171875, 34.4990234375, 37.546875, 40.5947265625, 43.642578125, 46.6904296875, 49.73828125, 52.7861328125, 55.833984375, 58.8818359375, 61.9296875, 64.9775390625, 68.025390625, 71.0732421875, 74.12109375, 77.1689453125, 80.216796875, 83.2646484375, 86.3125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 6.0, 6.0, 18.0, 18.0, 14.0, 18.0, 23.0, 31.0, 36.0, 76.0, 109.0, 193.0, 268.0, 324.0, 637.0, 1154.0, 2038.0, 3722.0, 7090.0, 13550.0, 26173.0, 50961.0, 98991.0, 693336.0, 5177059.0, 104227.0, 53022.0, 27207.0, 14381.0, 7463.0, 4033.0, 2111.0, 1225.0, 753.0, 426.0, 246.0, 182.0, 85.0, 62.0, 48.0, 37.0, 27.0, 25.0, 15.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-16.0625, -15.489501953125, -14.91650390625, -14.343505859375, -13.7705078125, -13.197509765625, -12.62451171875, -12.051513671875, -11.478515625, -10.905517578125, -10.33251953125, -9.759521484375, -9.1865234375, -8.613525390625, -8.04052734375, -7.467529296875, -6.89453125, -6.321533203125, -5.74853515625, -5.175537109375, -4.6025390625, -4.029541015625, -3.45654296875, -2.883544921875, -2.310546875, -1.737548828125, -1.16455078125, -0.591552734375, -0.0185546875, 0.554443359375, 1.12744140625, 1.700439453125, 2.2734375, 2.846435546875, 3.41943359375, 3.992431640625, 4.5654296875, 5.138427734375, 5.71142578125, 6.284423828125, 6.857421875, 7.430419921875, 8.00341796875, 8.576416015625, 9.1494140625, 9.722412109375, 10.29541015625, 10.868408203125, 11.44140625, 12.014404296875, 12.58740234375, 13.160400390625, 13.7333984375, 14.306396484375, 14.87939453125, 15.452392578125, 16.025390625, 16.598388671875, 17.17138671875, 17.744384765625, 18.3173828125, 18.890380859375, 19.46337890625, 20.036376953125, 20.609375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 9.0, 4.0, 7.0, 12.0, 9.0, 10.0, 16.0, 21.0, 20.0, 27.0, 32.0, 32.0, 36.0, 53.0, 39.0, 46.0, 48.0, 39.0, 88.0, 1020.0, 47.0, 52.0, 40.0, 33.0, 35.0, 29.0, 32.0, 38.0, 27.0, 13.0, 27.0, 15.0, 18.0, 15.0, 8.0, 6.0, 5.0, 6.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-107.1875, -104.1455078125, -101.103515625, -98.0615234375, -95.01953125, -91.9775390625, -88.935546875, -85.8935546875, -82.8515625, -79.8095703125, -76.767578125, -73.7255859375, -70.68359375, -67.6416015625, -64.599609375, -61.5576171875, -58.515625, -55.4736328125, -52.431640625, -49.3896484375, -46.34765625, -43.3056640625, -40.263671875, -37.2216796875, -34.1796875, -31.1376953125, -28.095703125, -25.0537109375, -22.01171875, -18.9697265625, -15.927734375, -12.8857421875, -9.84375, -6.8017578125, -3.759765625, -0.7177734375, 2.32421875, 5.3662109375, 8.408203125, 11.4501953125, 14.4921875, 17.5341796875, 20.576171875, 23.6181640625, 26.66015625, 29.7021484375, 32.744140625, 35.7861328125, 38.828125, 41.8701171875, 44.912109375, 47.9541015625, 50.99609375, 54.0380859375, 57.080078125, 60.1220703125, 63.1640625, 66.2060546875, 69.248046875, 72.2900390625, 75.33203125, 78.3740234375, 81.416015625, 84.4580078125, 87.5]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 13.0, 26.0, 82.0, 204.0, 332.0, 184.0, 81.0, 35.0, 17.0, 4.0, 6.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-135.7132568359375, -129.08135986328125, -122.449462890625, -115.81756591796875, -109.1856689453125, -102.55377197265625, -95.921875, -89.28997802734375, -82.6580810546875, -76.02618408203125, -69.394287109375, -62.76239013671875, -56.1304931640625, -49.49859619140625, -42.86669921875, -36.23480224609375, -29.6029052734375, -22.97100830078125, -16.339111328125, -9.70721435546875, -3.0753173828125, 3.55657958984375, 10.1884765625, 16.82037353515625, 23.4522705078125, 30.08416748046875, 36.716064453125, 43.34796142578125, 49.9798583984375, 56.61175537109375, 63.24365234375, 69.87554931640625, 76.5074462890625, 83.13934326171875, 89.771240234375, 96.40313720703125, 103.0350341796875, 109.66693115234375, 116.298828125, 122.93072509765625, 129.5626220703125, 136.19451904296875, 142.826416015625, 149.45831298828125, 156.0902099609375, 162.72210693359375, 169.35400390625, 175.98590087890625, 182.6177978515625, 189.24969482421875, 195.881591796875, 202.51348876953125, 209.1453857421875, 215.77728271484375, 222.4091796875, 229.04107666015625, 235.6729736328125, 242.30487060546875, 248.936767578125, 255.56866455078125, 262.2005615234375, 268.83245849609375, 275.46435546875, 282.09625244140625, 288.7281494140625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 6.0, 17.0, 14.0, 14.0, 14.0, 23.0, 31.0, 38.0, 38.0, 50.0, 46.0, 58.0, 64.0, 59.0, 51.0, 66.0, 54.0, 49.0, 50.0, 47.0, 29.0, 27.0, 32.0, 24.0, 14.0, 20.0, 9.0, 8.0, 7.0, 4.0, 5.0, 2.0, 2.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-216.37127685546875, -209.51707458496094, -202.66285705566406, -195.80865478515625, -188.95445251464844, -182.10025024414062, -175.24603271484375, -168.39183044433594, -161.53762817382812, -154.6834259033203, -147.82920837402344, -140.97500610351562, -134.1208038330078, -127.26659393310547, -120.41238403320312, -113.55818176269531, -106.70397186279297, -99.84976196289062, -92.99555969238281, -86.14134979248047, -79.28714752197266, -72.43293762207031, -65.5787353515625, -58.724525451660156, -51.87031936645508, -45.01611328125, -38.16190719604492, -31.30769920349121, -24.453493118286133, -17.599285125732422, -10.745079040527344, -3.8908729553222656, 2.9633331298828125, 9.81753921508789, 16.67174530029297, 23.52595329284668, 30.380159378051758, 37.23436737060547, 44.08857345581055, 50.942779541015625, 57.7969856262207, 64.65119171142578, 71.50540161132812, 78.35960388183594, 85.21381378173828, 92.06802368164062, 98.92222595214844, 105.77642822265625, 112.6306381225586, 119.48484802246094, 126.33905029296875, 133.19325256347656, 140.04747009277344, 146.90167236328125, 153.75587463378906, 160.61007690429688, 167.46429443359375, 174.31849670410156, 181.17271423339844, 188.02691650390625, 194.88111877441406, 201.73532104492188, 208.58953857421875, 215.44374084472656, 222.29794311523438]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 6.0, 8.0, 12.0, 9.0, 18.0, 16.0, 20.0, 42.0, 55.0, 79.0, 135.0, 194.0, 318.0, 511.0, 908.0, 1795.0, 3757.0, 10023.0, 40017.0, 3955508.0, 143474.0, 22202.0, 7639.0, 3323.0, 1640.0, 971.0, 570.0, 321.0, 233.0, 142.0, 82.0, 63.0, 50.0, 33.0, 16.0, 24.0, 15.0, 11.0, 14.0, 9.0, 6.0, 2.0, 7.0, 0.0, 3.0, 4.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8798828125, -1.8145599365234375, -1.749237060546875, -1.6839141845703125, -1.61859130859375, -1.5532684326171875, -1.487945556640625, -1.4226226806640625, -1.3572998046875, -1.2919769287109375, -1.226654052734375, -1.1613311767578125, -1.09600830078125, -1.0306854248046875, -0.965362548828125, -0.9000396728515625, -0.834716796875, -0.7693939208984375, -0.704071044921875, -0.6387481689453125, -0.57342529296875, -0.5081024169921875, -0.442779541015625, -0.3774566650390625, -0.3121337890625, -0.2468109130859375, -0.181488037109375, -0.1161651611328125, -0.05084228515625, 0.0144805908203125, 0.079803466796875, 0.1451263427734375, 0.21044921875, 0.2757720947265625, 0.341094970703125, 0.4064178466796875, 0.47174072265625, 0.5370635986328125, 0.602386474609375, 0.6677093505859375, 0.7330322265625, 0.7983551025390625, 0.863677978515625, 0.9290008544921875, 0.99432373046875, 1.0596466064453125, 1.124969482421875, 1.1902923583984375, 1.255615234375, 1.3209381103515625, 1.386260986328125, 1.4515838623046875, 1.51690673828125, 1.5822296142578125, 1.647552490234375, 1.7128753662109375, 1.7781982421875, 1.8435211181640625, 1.908843994140625, 1.9741668701171875, 2.03948974609375, 2.1048126220703125, 2.170135498046875, 2.2354583740234375, 2.30078125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 2.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 9.0, 13.0, 5.0, 7.0, 7.0, 17.0, 15.0, 22.0, 714.0, 64.0, 12.0, 10.0, 13.0, 9.0, 7.0, 7.0, 9.0, 9.0, 6.0, 2.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0244140625, -0.9902191162109375, -0.956024169921875, -0.9218292236328125, -0.88763427734375, -0.8534393310546875, -0.819244384765625, -0.7850494384765625, -0.7508544921875, -0.7166595458984375, -0.682464599609375, -0.6482696533203125, -0.61407470703125, -0.5798797607421875, -0.545684814453125, -0.5114898681640625, -0.477294921875, -0.4430999755859375, -0.408905029296875, -0.3747100830078125, -0.34051513671875, -0.3063201904296875, -0.272125244140625, -0.2379302978515625, -0.2037353515625, -0.1695404052734375, -0.135345458984375, -0.1011505126953125, -0.06695556640625, -0.0327606201171875, 0.001434326171875, 0.0356292724609375, 0.06982421875, 0.1040191650390625, 0.138214111328125, 0.1724090576171875, 0.20660400390625, 0.2407989501953125, 0.274993896484375, 0.3091888427734375, 0.3433837890625, 0.3775787353515625, 0.411773681640625, 0.4459686279296875, 0.48016357421875, 0.5143585205078125, 0.548553466796875, 0.5827484130859375, 0.616943359375, 0.6511383056640625, 0.685333251953125, 0.7195281982421875, 0.75372314453125, 0.7879180908203125, 0.822113037109375, 0.8563079833984375, 0.8905029296875, 0.9246978759765625, 0.958892822265625, 0.9930877685546875, 1.02728271484375, 1.0614776611328125, 1.095672607421875, 1.1298675537109375, 1.1640625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 1.0, 6.0, 7.0, 5.0, 9.0, 3.0, 11.0, 13.0, 14.0, 24.0, 32.0, 38.0, 50.0, 84.0, 136.0, 224.0, 364.0, 677.0, 1031.0, 2129.0, 4452.0, 10734.0, 32862.0, 166143.0, 3275171.0, 608903.0, 62774.0, 16454.0, 5963.0, 2686.0, 1346.0, 729.0, 408.0, 262.0, 169.0, 118.0, 75.0, 49.0, 37.0, 21.0, 25.0, 11.0, 3.0, 8.0, 10.0, 12.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2041015625, -1.1622161865234375, -1.120330810546875, -1.0784454345703125, -1.03656005859375, -0.9946746826171875, -0.952789306640625, -0.9109039306640625, -0.8690185546875, -0.8271331787109375, -0.785247802734375, -0.7433624267578125, -0.70147705078125, -0.6595916748046875, -0.617706298828125, -0.5758209228515625, -0.533935546875, -0.4920501708984375, -0.450164794921875, -0.4082794189453125, -0.36639404296875, -0.3245086669921875, -0.282623291015625, -0.2407379150390625, -0.1988525390625, -0.1569671630859375, -0.115081787109375, -0.0731964111328125, -0.03131103515625, 0.0105743408203125, 0.052459716796875, 0.0943450927734375, 0.13623046875, 0.1781158447265625, 0.220001220703125, 0.2618865966796875, 0.30377197265625, 0.3456573486328125, 0.387542724609375, 0.4294281005859375, 0.4713134765625, 0.5131988525390625, 0.555084228515625, 0.5969696044921875, 0.63885498046875, 0.6807403564453125, 0.722625732421875, 0.7645111083984375, 0.806396484375, 0.8482818603515625, 0.890167236328125, 0.9320526123046875, 0.97393798828125, 1.0158233642578125, 1.057708740234375, 1.0995941162109375, 1.1414794921875, 1.1833648681640625, 1.225250244140625, 1.2671356201171875, 1.30902099609375, 1.3509063720703125, 1.392791748046875, 1.4346771240234375, 1.4765625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 10.0, 12.0, 6.0, 15.0, 26.0, 27.0, 42.0, 53.0, 96.0, 158.0, 292.0, 776.0, 1554.0, 444.0, 211.0, 113.0, 72.0, 50.0, 28.0, 17.0, 13.0, 16.0, 9.0, 6.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9072265625, -0.8762359619140625, -0.845245361328125, -0.8142547607421875, -0.78326416015625, -0.7522735595703125, -0.721282958984375, -0.6902923583984375, -0.6593017578125, -0.6283111572265625, -0.597320556640625, -0.5663299560546875, -0.53533935546875, -0.5043487548828125, -0.473358154296875, -0.4423675537109375, -0.411376953125, -0.3803863525390625, -0.349395751953125, -0.3184051513671875, -0.28741455078125, -0.2564239501953125, -0.225433349609375, -0.1944427490234375, -0.1634521484375, -0.1324615478515625, -0.101470947265625, -0.0704803466796875, -0.03948974609375, -0.0084991455078125, 0.022491455078125, 0.0534820556640625, 0.08447265625, 0.1154632568359375, 0.146453857421875, 0.1774444580078125, 0.20843505859375, 0.2394256591796875, 0.270416259765625, 0.3014068603515625, 0.3323974609375, 0.3633880615234375, 0.394378662109375, 0.4253692626953125, 0.45635986328125, 0.4873504638671875, 0.518341064453125, 0.5493316650390625, 0.580322265625, 0.6113128662109375, 0.642303466796875, 0.6732940673828125, 0.70428466796875, 0.7352752685546875, 0.766265869140625, 0.7972564697265625, 0.8282470703125, 0.8592376708984375, 0.890228271484375, 0.9212188720703125, 0.95220947265625, 0.9832000732421875, 1.014190673828125, 1.0451812744140625, 1.076171875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 3.0, 12.0, 34.0, 83.0, 307.0, 387.0, 127.0, 36.0, 12.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.033174514770508, -9.833477973937988, -9.633781433105469, -9.434085845947266, -9.234389305114746, -9.034692764282227, -8.834996223449707, -8.635299682617188, -8.435604095458984, -8.235907554626465, -8.036211013793945, -7.836514949798584, -7.636818885803223, -7.437122344970703, -7.237425804138184, -7.037729740142822, -6.838033199310303, -6.638336658477783, -6.438640594482422, -6.238944053649902, -6.039247989654541, -5.8395514488220215, -5.63985538482666, -5.440158843994141, -5.240462303161621, -5.040765762329102, -4.84106969833374, -4.641373157501221, -4.441677093505859, -4.24198055267334, -4.04228401184082, -3.842587947845459, -3.642892360687256, -3.4431960582733154, -3.243499755859375, -3.0438032150268555, -2.844107151031494, -2.6444106101989746, -2.444714307785034, -2.2450180053710938, -2.0453217029571533, -1.845625400543213, -1.6459290981292725, -1.4462326765060425, -1.246536374092102, -1.0468400716781616, -0.8471436500549316, -0.6474473476409912, -0.4477510452270508, -0.24805471301078796, -0.048358380794525146, 0.15133798122406006, 0.3510342836380005, 0.5507305860519409, 0.7504270076751709, 0.9501233100891113, 1.1498196125030518, 1.3495159149169922, 1.5492122173309326, 1.7489086389541626, 1.948604941368103, 2.148301124572754, 2.3479976654052734, 2.547693967819214, 2.7473902702331543]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 4.0, 0.0, 4.0, 2.0, 6.0, 3.0, 8.0, 8.0, 14.0, 19.0, 21.0, 23.0, 32.0, 30.0, 37.0, 50.0, 48.0, 58.0, 60.0, 71.0, 56.0, 50.0, 44.0, 69.0, 54.0, 49.0, 39.0, 32.0, 23.0, 27.0, 15.0, 10.0, 6.0, 9.0, 7.0, 5.0, 5.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.3316245079040527, -3.231184959411621, -3.1307456493377686, -3.030306100845337, -2.9298665523529053, -2.8294272422790527, -2.728987693786621, -2.6285481452941895, -2.528108596801758, -2.427669048309326, -2.3272297382354736, -2.226790189743042, -2.1263506412506104, -2.025911331176758, -1.9254717826843262, -1.8250322341918945, -1.724592924118042, -1.6241534948349, -1.5237139463424683, -1.4232745170593262, -1.3228349685668945, -1.2223955392837524, -1.1219561100006104, -1.0215165615081787, -0.9210771322250366, -0.8206376433372498, -0.7201981544494629, -0.6197587251663208, -0.5193192362785339, -0.41887974739074707, -0.318440318107605, -0.21800082921981812, -0.11756134033203125, -0.01712186634540558, 0.08331760764122009, 0.18375706672668457, 0.28419655561447144, 0.3846360445022583, 0.4850754737854004, 0.5855149626731873, 0.6859544515609741, 0.786393940448761, 0.8868334293365479, 0.9872728586196899, 1.087712287902832, 1.1881518363952637, 1.2885912656784058, 1.3890306949615479, 1.4894702434539795, 1.5899096727371216, 1.6903492212295532, 1.7907886505126953, 1.891228199005127, 1.991667628288269, 2.092107057571411, 2.1925466060638428, 2.2929859161376953, 2.393425464630127, 2.4938647747039795, 2.594304323196411, 2.6947438716888428, 2.7951831817626953, 2.895622730255127, 2.9960622787475586, 3.0965018272399902]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 9.0, 6.0, 4.0, 11.0, 11.0, 17.0, 18.0, 32.0, 26.0, 53.0, 60.0, 76.0, 112.0, 125.0, 178.0, 223.0, 298.0, 407.0, 577.0, 755.0, 1082.0, 1566.0, 2296.0, 3521.0, 5685.0, 9704.0, 17519.0, 37772.0, 857979.0, 55408.0, 21977.0, 11438.0, 6596.0, 4071.0, 2667.0, 1822.0, 1242.0, 792.0, 618.0, 454.0, 320.0, 259.0, 169.0, 159.0, 107.0, 88.0, 66.0, 42.0, 26.0, 36.0, 21.0, 17.0, 16.0, 9.0, 5.0, 10.0, 1.0, 2.0, 4.0, 1.0, 2.0], "bins": [-3.68359375, -3.567230224609375, -3.45086669921875, -3.334503173828125, -3.2181396484375, -3.101776123046875, -2.98541259765625, -2.869049072265625, -2.752685546875, -2.636322021484375, -2.51995849609375, -2.403594970703125, -2.2872314453125, -2.170867919921875, -2.05450439453125, -1.938140869140625, -1.82177734375, -1.705413818359375, -1.58905029296875, -1.472686767578125, -1.3563232421875, -1.239959716796875, -1.12359619140625, -1.007232666015625, -0.890869140625, -0.774505615234375, -0.65814208984375, -0.541778564453125, -0.4254150390625, -0.309051513671875, -0.19268798828125, -0.076324462890625, 0.0400390625, 0.156402587890625, 0.27276611328125, 0.389129638671875, 0.5054931640625, 0.621856689453125, 0.73822021484375, 0.854583740234375, 0.970947265625, 1.087310791015625, 1.20367431640625, 1.320037841796875, 1.4364013671875, 1.552764892578125, 1.66912841796875, 1.785491943359375, 1.90185546875, 2.018218994140625, 2.13458251953125, 2.250946044921875, 2.3673095703125, 2.483673095703125, 2.60003662109375, 2.716400146484375, 2.832763671875, 2.949127197265625, 3.06549072265625, 3.181854248046875, 3.2982177734375, 3.414581298828125, 3.53094482421875, 3.647308349609375, 3.763671875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 3.0, 3.0, 7.0, 13.0, 11.0, 2.0, 11.0, 2.0, 14.0, 17.0, 17.0, 385.0, 395.0, 16.0, 9.0, 9.0, 13.0, 9.0, 6.0, 5.0, 9.0, 10.0, 2.0, 2.0, 9.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.97900390625, -0.9464797973632812, -0.9139556884765625, -0.8814315795898438, -0.848907470703125, -0.8163833618164062, -0.7838592529296875, -0.7513351440429688, -0.71881103515625, -0.6862869262695312, -0.6537628173828125, -0.6212387084960938, -0.588714599609375, -0.5561904907226562, -0.5236663818359375, -0.49114227294921875, -0.4586181640625, -0.42609405517578125, -0.3935699462890625, -0.36104583740234375, -0.328521728515625, -0.29599761962890625, -0.2634735107421875, -0.23094940185546875, -0.19842529296875, -0.16590118408203125, -0.1333770751953125, -0.10085296630859375, -0.068328857421875, -0.03580474853515625, -0.0032806396484375, 0.02924346923828125, 0.061767578125, 0.09429168701171875, 0.1268157958984375, 0.15933990478515625, 0.191864013671875, 0.22438812255859375, 0.2569122314453125, 0.28943634033203125, 0.32196044921875, 0.35448455810546875, 0.3870086669921875, 0.41953277587890625, 0.452056884765625, 0.48458099365234375, 0.5171051025390625, 0.5496292114257812, 0.5821533203125, 0.6146774291992188, 0.6472015380859375, 0.6797256469726562, 0.712249755859375, 0.7447738647460938, 0.7772979736328125, 0.8098220825195312, 0.84234619140625, 0.8748703002929688, 0.9073944091796875, 0.9399185180664062, 0.972442626953125, 1.0049667358398438, 1.0374908447265625, 1.0700149536132812, 1.1025390625]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 2.0, 9.0, 3.0, 8.0, 17.0, 18.0, 31.0, 37.0, 55.0, 82.0, 91.0, 147.0, 242.0, 373.0, 665.0, 1286.0, 2859.0, 6926.0, 20540.0, 78535.0, 449112.0, 387864.0, 69209.0, 18580.0, 6301.0, 2595.0, 1222.0, 646.0, 341.0, 237.0, 155.0, 98.0, 77.0, 56.0, 33.0, 28.0, 17.0, 7.0, 10.0, 13.0, 3.0, 5.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.63671875, -3.532684326171875, -3.42864990234375, -3.324615478515625, -3.2205810546875, -3.116546630859375, -3.01251220703125, -2.908477783203125, -2.804443359375, -2.700408935546875, -2.59637451171875, -2.492340087890625, -2.3883056640625, -2.284271240234375, -2.18023681640625, -2.076202392578125, -1.97216796875, -1.868133544921875, -1.76409912109375, -1.660064697265625, -1.5560302734375, -1.451995849609375, -1.34796142578125, -1.243927001953125, -1.139892578125, -1.035858154296875, -0.93182373046875, -0.827789306640625, -0.7237548828125, -0.619720458984375, -0.51568603515625, -0.411651611328125, -0.3076171875, -0.203582763671875, -0.09954833984375, 0.004486083984375, 0.1085205078125, 0.212554931640625, 0.31658935546875, 0.420623779296875, 0.524658203125, 0.628692626953125, 0.73272705078125, 0.836761474609375, 0.9407958984375, 1.044830322265625, 1.14886474609375, 1.252899169921875, 1.35693359375, 1.460968017578125, 1.56500244140625, 1.669036865234375, 1.7730712890625, 1.877105712890625, 1.98114013671875, 2.085174560546875, 2.189208984375, 2.293243408203125, 2.39727783203125, 2.501312255859375, 2.6053466796875, 2.709381103515625, 2.81341552734375, 2.917449951171875, 3.021484375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 7.0, 4.0, 6.0, 2.0, 7.0, 3.0, 7.0, 12.0, 6.0, 17.0, 12.0, 17.0, 22.0, 22.0, 29.0, 27.0, 26.0, 32.0, 45.0, 35.0, 50.0, 46.0, 35.0, 43.0, 53.0, 42.0, 53.0, 41.0, 33.0, 27.0, 38.0, 31.0, 29.0, 25.0, 17.0, 19.0, 17.0, 18.0, 14.0, 5.0, 7.0, 9.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.98046875, -3.84539794921875, -3.7103271484375, -3.57525634765625, -3.440185546875, -3.30511474609375, -3.1700439453125, -3.03497314453125, -2.89990234375, -2.76483154296875, -2.6297607421875, -2.49468994140625, -2.359619140625, -2.22454833984375, -2.0894775390625, -1.95440673828125, -1.8193359375, -1.68426513671875, -1.5491943359375, -1.41412353515625, -1.279052734375, -1.14398193359375, -1.0089111328125, -0.87384033203125, -0.73876953125, -0.60369873046875, -0.4686279296875, -0.33355712890625, -0.198486328125, -0.06341552734375, 0.0716552734375, 0.20672607421875, 0.341796875, 0.47686767578125, 0.6119384765625, 0.74700927734375, 0.882080078125, 1.01715087890625, 1.1522216796875, 1.28729248046875, 1.42236328125, 1.55743408203125, 1.6925048828125, 1.82757568359375, 1.962646484375, 2.09771728515625, 2.2327880859375, 2.36785888671875, 2.5029296875, 2.63800048828125, 2.7730712890625, 2.90814208984375, 3.043212890625, 3.17828369140625, 3.3133544921875, 3.44842529296875, 3.58349609375, 3.71856689453125, 3.8536376953125, 3.98870849609375, 4.123779296875, 4.25885009765625, 4.3939208984375, 4.52899169921875, 4.6640625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 17.0, 23.0, 32.0, 52.0, 109.0, 264.0, 757.0, 4203.0, 523739.0, 513900.0, 4165.0, 782.0, 242.0, 112.0, 63.0, 35.0, 15.0, 11.0, 5.0, 2.0, 4.0, 6.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.671875, -22.118896484375, -21.56591796875, -21.012939453125, -20.4599609375, -19.906982421875, -19.35400390625, -18.801025390625, -18.248046875, -17.695068359375, -17.14208984375, -16.589111328125, -16.0361328125, -15.483154296875, -14.93017578125, -14.377197265625, -13.82421875, -13.271240234375, -12.71826171875, -12.165283203125, -11.6123046875, -11.059326171875, -10.50634765625, -9.953369140625, -9.400390625, -8.847412109375, -8.29443359375, -7.741455078125, -7.1884765625, -6.635498046875, -6.08251953125, -5.529541015625, -4.9765625, -4.423583984375, -3.87060546875, -3.317626953125, -2.7646484375, -2.211669921875, -1.65869140625, -1.105712890625, -0.552734375, 0.000244140625, 0.55322265625, 1.106201171875, 1.6591796875, 2.212158203125, 2.76513671875, 3.318115234375, 3.87109375, 4.424072265625, 4.97705078125, 5.530029296875, 6.0830078125, 6.635986328125, 7.18896484375, 7.741943359375, 8.294921875, 8.847900390625, 9.40087890625, 9.953857421875, 10.5068359375, 11.059814453125, 11.61279296875, 12.165771484375, 12.71875]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 6.0, 3.0, 5.0, 7.0, 13.0, 26.0, 22.0, 42.0, 80.0, 144.0, 235.0, 175.0, 96.0, 53.0, 22.0, 14.0, 20.0, 6.0, 6.0, 7.0, 8.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00027251243591308594, -0.00026417896151542664, -0.00025584548711776733, -0.00024751201272010803, -0.00023917853832244873, -0.00023084506392478943, -0.00022251158952713013, -0.00021417811512947083, -0.00020584464073181152, -0.00019751116633415222, -0.00018917769193649292, -0.00018084421753883362, -0.00017251074314117432, -0.00016417726874351501, -0.0001558437943458557, -0.0001475103199481964, -0.0001391768455505371, -0.0001308433711528778, -0.0001225098967552185, -0.0001141764223575592, -0.0001058429479598999, -9.75094735622406e-05, -8.91759991645813e-05, -8.0842524766922e-05, -7.25090503692627e-05, -6.41755759716034e-05, -5.584210157394409e-05, -4.750862717628479e-05, -3.917515277862549e-05, -3.0841678380966187e-05, -2.2508203983306885e-05, -1.4174729585647583e-05, -5.841255187988281e-06, 2.4922192096710205e-06, 1.0825693607330322e-05, 1.9159168004989624e-05, 2.7492642402648926e-05, 3.582611680030823e-05, 4.415959119796753e-05, 5.249306559562683e-05, 6.082653999328613e-05, 6.916001439094543e-05, 7.749348878860474e-05, 8.582696318626404e-05, 9.416043758392334e-05, 0.00010249391198158264, 0.00011082738637924194, 0.00011916086077690125, 0.00012749433517456055, 0.00013582780957221985, 0.00014416128396987915, 0.00015249475836753845, 0.00016082823276519775, 0.00016916170716285706, 0.00017749518156051636, 0.00018582865595817566, 0.00019416213035583496, 0.00020249560475349426, 0.00021082907915115356, 0.00021916255354881287, 0.00022749602794647217, 0.00023582950234413147, 0.00024416297674179077, 0.0002524964511394501, 0.0002608299255371094]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 14.0, 17.0, 32.0, 55.0, 128.0, 277.0, 932.0, 4104.0, 57615.0, 953358.0, 28063.0, 2865.0, 652.0, 224.0, 103.0, 53.0, 17.0, 10.0, 11.0, 1.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.0703125, -9.814697265625, -9.55908203125, -9.303466796875, -9.0478515625, -8.792236328125, -8.53662109375, -8.281005859375, -8.025390625, -7.769775390625, -7.51416015625, -7.258544921875, -7.0029296875, -6.747314453125, -6.49169921875, -6.236083984375, -5.98046875, -5.724853515625, -5.46923828125, -5.213623046875, -4.9580078125, -4.702392578125, -4.44677734375, -4.191162109375, -3.935546875, -3.679931640625, -3.42431640625, -3.168701171875, -2.9130859375, -2.657470703125, -2.40185546875, -2.146240234375, -1.890625, -1.635009765625, -1.37939453125, -1.123779296875, -0.8681640625, -0.612548828125, -0.35693359375, -0.101318359375, 0.154296875, 0.409912109375, 0.66552734375, 0.921142578125, 1.1767578125, 1.432373046875, 1.68798828125, 1.943603515625, 2.19921875, 2.454833984375, 2.71044921875, 2.966064453125, 3.2216796875, 3.477294921875, 3.73291015625, 3.988525390625, 4.244140625, 4.499755859375, 4.75537109375, 5.010986328125, 5.2666015625, 5.522216796875, 5.77783203125, 6.033447265625, 6.2890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 5.0, 4.0, 0.0, 7.0, 5.0, 9.0, 11.0, 10.0, 11.0, 15.0, 21.0, 28.0, 47.0, 47.0, 75.0, 118.0, 123.0, 119.0, 111.0, 54.0, 60.0, 30.0, 20.0, 23.0, 6.0, 14.0, 10.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.91796875, -4.77215576171875, -4.6263427734375, -4.48052978515625, -4.334716796875, -4.18890380859375, -4.0430908203125, -3.89727783203125, -3.75146484375, -3.60565185546875, -3.4598388671875, -3.31402587890625, -3.168212890625, -3.02239990234375, -2.8765869140625, -2.73077392578125, -2.5849609375, -2.43914794921875, -2.2933349609375, -2.14752197265625, -2.001708984375, -1.85589599609375, -1.7100830078125, -1.56427001953125, -1.41845703125, -1.27264404296875, -1.1268310546875, -0.98101806640625, -0.835205078125, -0.68939208984375, -0.5435791015625, -0.39776611328125, -0.251953125, -0.10614013671875, 0.0396728515625, 0.18548583984375, 0.331298828125, 0.47711181640625, 0.6229248046875, 0.76873779296875, 0.91455078125, 1.06036376953125, 1.2061767578125, 1.35198974609375, 1.497802734375, 1.64361572265625, 1.7894287109375, 1.93524169921875, 2.0810546875, 2.22686767578125, 2.3726806640625, 2.51849365234375, 2.664306640625, 2.81011962890625, 2.9559326171875, 3.10174560546875, 3.24755859375, 3.39337158203125, 3.5391845703125, 3.68499755859375, 3.830810546875, 3.97662353515625, 4.1224365234375, 4.26824951171875, 4.4140625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 12.0, 19.0, 109.0, 600.0, 229.0, 23.0, 13.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-178.42477416992188, -174.83535766601562, -171.2459259033203, -167.65650939941406, -164.06707763671875, -160.4776611328125, -156.88824462890625, -153.29881286621094, -149.7093963623047, -146.11997985839844, -142.53054809570312, -138.94113159179688, -135.35169982910156, -131.7622833251953, -128.1728515625, -124.58343505859375, -120.99400329589844, -117.40457916259766, -113.81515502929688, -110.22573852539062, -106.63631439208984, -103.04689025878906, -99.45746612548828, -95.8680419921875, -92.27862548828125, -88.68920135498047, -85.09977722167969, -81.51036071777344, -77.92093658447266, -74.33151245117188, -70.7420883178711, -67.15266418457031, -63.5632438659668, -59.973819732666016, -56.3843994140625, -52.79497528076172, -49.20555114746094, -45.616127014160156, -42.02670669555664, -38.43728256225586, -34.847862243652344, -31.258440017700195, -27.669015884399414, -24.079593658447266, -20.490169525146484, -16.900747299194336, -13.311325073242188, -9.721900939941406, -6.132476806640625, -2.5430538654327393, 1.0463690757751465, 4.635791778564453, 8.225214958190918, 11.814638137817383, 15.404060363769531, 18.993484497070312, 22.58290672302246, 26.17232894897461, 29.76175308227539, 33.351173400878906, 36.94059753417969, 40.53002166748047, 44.11944580078125, 47.70886993408203, 51.29829025268555]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 4.0, 6.0, 2.0, 5.0, 6.0, 6.0, 12.0, 26.0, 28.0, 55.0, 76.0, 148.0, 160.0, 146.0, 115.0, 57.0, 37.0, 22.0, 12.0, 14.0, 9.0, 9.0, 3.0, 5.0, 5.0, 3.0, 6.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-89.54913330078125, -86.96958923339844, -84.39004516601562, -81.81050109863281, -79.23095703125, -76.65141296386719, -74.07186889648438, -71.49232482910156, -68.91278076171875, -66.33323669433594, -63.753692626953125, -61.17414855957031, -58.5946044921875, -56.01506042480469, -53.435516357421875, -50.85597229003906, -48.27642822265625, -45.69688415527344, -43.117340087890625, -40.53779602050781, -37.958251953125, -35.37870788574219, -32.799163818359375, -30.219619750976562, -27.64007568359375, -25.060531616210938, -22.480987548828125, -19.901443481445312, -17.3218994140625, -14.742355346679688, -12.162811279296875, -9.583267211914062, -7.00372314453125, -4.4241790771484375, -1.844635009765625, 0.7349090576171875, 3.314453125, 5.8939971923828125, 8.473541259765625, 11.053085327148438, 13.63262939453125, 16.212173461914062, 18.791717529296875, 21.371261596679688, 23.9508056640625, 26.530349731445312, 29.109893798828125, 31.689437866210938, 34.26898193359375, 36.84852600097656, 39.428070068359375, 42.00761413574219, 44.587158203125, 47.16670227050781, 49.746246337890625, 52.32579040527344, 54.90533447265625, 57.48487854003906, 60.064422607421875, 62.64396667480469, 65.2235107421875, 67.80305480957031, 70.38259887695312, 72.96214294433594, 75.54168701171875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 15.0, 9.0, 14.0, 37.0, 34.0, 55.0, 71.0, 99.0, 139.0, 230.0, 356.0, 532.0, 823.0, 1312.0, 2073.0, 3782.0, 6856.0, 14597.0, 41500.0, 372621.0, 3632348.0, 75657.0, 20727.0, 8752.0, 4543.0, 2681.0, 1541.0, 954.0, 623.0, 372.0, 303.0, 196.0, 123.0, 79.0, 65.0, 47.0, 30.0, 24.0, 17.0, 12.0, 13.0, 7.0, 6.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.55078125, -5.3466796875, -5.142578125, -4.9384765625, -4.734375, -4.5302734375, -4.326171875, -4.1220703125, -3.91796875, -3.7138671875, -3.509765625, -3.3056640625, -3.1015625, -2.8974609375, -2.693359375, -2.4892578125, -2.28515625, -2.0810546875, -1.876953125, -1.6728515625, -1.46875, -1.2646484375, -1.060546875, -0.8564453125, -0.65234375, -0.4482421875, -0.244140625, -0.0400390625, 0.1640625, 0.3681640625, 0.572265625, 0.7763671875, 0.98046875, 1.1845703125, 1.388671875, 1.5927734375, 1.796875, 2.0009765625, 2.205078125, 2.4091796875, 2.61328125, 2.8173828125, 3.021484375, 3.2255859375, 3.4296875, 3.6337890625, 3.837890625, 4.0419921875, 4.24609375, 4.4501953125, 4.654296875, 4.8583984375, 5.0625, 5.2666015625, 5.470703125, 5.6748046875, 5.87890625, 6.0830078125, 6.287109375, 6.4912109375, 6.6953125, 6.8994140625, 7.103515625, 7.3076171875, 7.51171875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 3.0, 4.0, 5.0, 4.0, 6.0, 8.0, 12.0, 11.0, 6.0, 3.0, 9.0, 16.0, 34.0, 88.0, 219.0, 286.0, 124.0, 49.0, 18.0, 20.0, 10.0, 10.0, 4.0, 10.0, 6.0, 4.0, 6.0, 5.0, 2.0, 2.0, 4.0, 8.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68603515625, -0.65985107421875, -0.6336669921875, -0.60748291015625, -0.581298828125, -0.55511474609375, -0.5289306640625, -0.50274658203125, -0.4765625, -0.45037841796875, -0.4241943359375, -0.39801025390625, -0.371826171875, -0.34564208984375, -0.3194580078125, -0.29327392578125, -0.26708984375, -0.24090576171875, -0.2147216796875, -0.18853759765625, -0.162353515625, -0.13616943359375, -0.1099853515625, -0.08380126953125, -0.0576171875, -0.03143310546875, -0.0052490234375, 0.02093505859375, 0.047119140625, 0.07330322265625, 0.0994873046875, 0.12567138671875, 0.15185546875, 0.17803955078125, 0.2042236328125, 0.23040771484375, 0.256591796875, 0.28277587890625, 0.3089599609375, 0.33514404296875, 0.361328125, 0.38751220703125, 0.4136962890625, 0.43988037109375, 0.466064453125, 0.49224853515625, 0.5184326171875, 0.54461669921875, 0.57080078125, 0.59698486328125, 0.6231689453125, 0.64935302734375, 0.675537109375, 0.70172119140625, 0.7279052734375, 0.75408935546875, 0.7802734375, 0.80645751953125, 0.8326416015625, 0.85882568359375, 0.885009765625, 0.91119384765625, 0.9373779296875, 0.96356201171875, 0.98974609375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 2.0, 5.0, 8.0, 3.0, 13.0, 11.0, 14.0, 22.0, 25.0, 38.0, 42.0, 73.0, 113.0, 188.0, 337.0, 528.0, 976.0, 1795.0, 3862.0, 10361.0, 40365.0, 416926.0, 3554734.0, 129692.0, 21625.0, 6684.0, 2667.0, 1276.0, 742.0, 420.0, 223.0, 169.0, 109.0, 62.0, 36.0, 35.0, 22.0, 16.0, 16.0, 14.0, 7.0, 8.0, 7.0, 9.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1953125, -4.0521240234375, -3.908935546875, -3.7657470703125, -3.62255859375, -3.4793701171875, -3.336181640625, -3.1929931640625, -3.0498046875, -2.9066162109375, -2.763427734375, -2.6202392578125, -2.47705078125, -2.3338623046875, -2.190673828125, -2.0474853515625, -1.904296875, -1.7611083984375, -1.617919921875, -1.4747314453125, -1.33154296875, -1.1883544921875, -1.045166015625, -0.9019775390625, -0.7587890625, -0.6156005859375, -0.472412109375, -0.3292236328125, -0.18603515625, -0.0428466796875, 0.100341796875, 0.2435302734375, 0.38671875, 0.5299072265625, 0.673095703125, 0.8162841796875, 0.95947265625, 1.1026611328125, 1.245849609375, 1.3890380859375, 1.5322265625, 1.6754150390625, 1.818603515625, 1.9617919921875, 2.10498046875, 2.2481689453125, 2.391357421875, 2.5345458984375, 2.677734375, 2.8209228515625, 2.964111328125, 3.1072998046875, 3.25048828125, 3.3936767578125, 3.536865234375, 3.6800537109375, 3.8232421875, 3.9664306640625, 4.109619140625, 4.2528076171875, 4.39599609375, 4.5391845703125, 4.682373046875, 4.8255615234375, 4.96875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 5.0, 10.0, 5.0, 14.0, 13.0, 10.0, 27.0, 35.0, 67.0, 108.0, 257.0, 705.0, 1751.0, 575.0, 203.0, 114.0, 57.0, 39.0, 19.0, 19.0, 6.0, 10.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.412109375, -1.3698272705078125, -1.327545166015625, -1.2852630615234375, -1.24298095703125, -1.2006988525390625, -1.158416748046875, -1.1161346435546875, -1.0738525390625, -1.0315704345703125, -0.989288330078125, -0.9470062255859375, -0.90472412109375, -0.8624420166015625, -0.820159912109375, -0.7778778076171875, -0.735595703125, -0.6933135986328125, -0.651031494140625, -0.6087493896484375, -0.56646728515625, -0.5241851806640625, -0.481903076171875, -0.4396209716796875, -0.3973388671875, -0.3550567626953125, -0.312774658203125, -0.2704925537109375, -0.22821044921875, -0.1859283447265625, -0.143646240234375, -0.1013641357421875, -0.05908203125, -0.0167999267578125, 0.025482177734375, 0.0677642822265625, 0.11004638671875, 0.1523284912109375, 0.194610595703125, 0.2368927001953125, 0.2791748046875, 0.3214569091796875, 0.363739013671875, 0.4060211181640625, 0.44830322265625, 0.4905853271484375, 0.532867431640625, 0.5751495361328125, 0.617431640625, 0.6597137451171875, 0.701995849609375, 0.7442779541015625, 0.78656005859375, 0.8288421630859375, 0.871124267578125, 0.9134063720703125, 0.9556884765625, 0.9979705810546875, 1.040252685546875, 1.0825347900390625, 1.12481689453125, 1.1670989990234375, 1.209381103515625, 1.2516632080078125, 1.2939453125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 9.0, 13.0, 43.0, 154.0, 483.0, 239.0, 35.0, 13.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.43277359008789, -15.079437255859375, -14.726099967956543, -14.372763633728027, -14.019427299499512, -13.66609001159668, -13.312753677368164, -12.959417343139648, -12.606081008911133, -12.252744674682617, -11.899407386779785, -11.54607105255127, -11.192734718322754, -10.839397430419922, -10.486061096191406, -10.13272476196289, -9.779387474060059, -9.426051139831543, -9.072713851928711, -8.719377517700195, -8.36604118347168, -8.012704849243164, -7.659367561340332, -7.306031227111816, -6.952694416046143, -6.599357604980469, -6.246021270751953, -5.892684459686279, -5.5393476486206055, -5.18601131439209, -4.832674503326416, -4.479337692260742, -4.126000881195068, -3.7726643085479736, -3.419327735900879, -3.065990924835205, -2.7126543521881104, -2.3593177795410156, -2.005980968475342, -1.652644395828247, -1.2993078231811523, -0.9459711909294128, -0.5926345586776733, -0.23929786682128906, 0.11403870582580566, 0.4673752784729004, 0.8207120895385742, 1.174048662185669, 1.5273852348327637, 1.8807218074798584, 2.234058380126953, 2.587395191192627, 2.9407317638397217, 3.2940683364868164, 3.6474051475524902, 4.000741958618164, 4.35407829284668, 4.7074151039123535, 5.060751438140869, 5.414088249206543, 5.767424583435059, 6.120761394500732, 6.474098205566406, 6.827434539794922, 7.180771350860596]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 10.0, 5.0, 7.0, 4.0, 6.0, 16.0, 28.0, 32.0, 26.0, 52.0, 91.0, 86.0, 91.0, 89.0, 102.0, 85.0, 68.0, 45.0, 31.0, 29.0, 20.0, 12.0, 13.0, 14.0, 8.0, 2.0, 6.0, 3.0, 4.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.185232162475586, -5.993945121765137, -5.802658557891846, -5.6113715171813965, -5.420084476470947, -5.228797912597656, -5.037510871887207, -4.846223831176758, -4.654936790466309, -4.463649749755859, -4.272363185882568, -4.081076145172119, -3.88978910446167, -3.6985023021698, -3.5072154998779297, -3.3159284591674805, -3.1246418952941895, -2.9333550930023193, -2.74206805229187, -2.55078125, -2.359494209289551, -2.1682074069976807, -1.9769206047058105, -1.7856336832046509, -1.5943467617034912, -1.4030598402023315, -1.2117729187011719, -1.0204861164093018, -0.8291991949081421, -0.6379122734069824, -0.4466254711151123, -0.25533854961395264, -0.06405162811279297, 0.1272352635860443, 0.3185221552848816, 0.5098090171813965, 0.7010959386825562, 0.8923828601837158, 1.083669662475586, 1.2749565839767456, 1.4662435054779053, 1.657530426979065, 1.8488173484802246, 2.0401041507720947, 2.231390953063965, 2.422677993774414, 2.613964796066284, 2.8052515983581543, 2.9965386390686035, 3.1878254413604736, 3.379112482070923, 3.570399284362793, 3.761686325073242, 3.9529731273651123, 4.144259929656982, 4.335546970367432, 4.526833534240723, 4.718120574951172, 4.909407138824463, 5.100694179534912, 5.291981220245361, 5.483267784118652, 5.674554824829102, 5.865841865539551, 6.05712890625]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 10.0, 6.0, 12.0, 9.0, 17.0, 28.0, 48.0, 67.0, 79.0, 136.0, 166.0, 317.0, 437.0, 736.0, 1308.0, 2300.0, 4058.0, 7926.0, 17908.0, 60901.0, 759322.0, 144966.0, 25490.0, 10457.0, 5126.0, 2735.0, 1515.0, 934.0, 544.0, 342.0, 205.0, 142.0, 100.0, 63.0, 54.0, 29.0, 14.0, 19.0, 9.0, 7.0, 6.0, 3.0, 2.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.25, -4.1158447265625, -3.981689453125, -3.8475341796875, -3.71337890625, -3.5792236328125, -3.445068359375, -3.3109130859375, -3.1767578125, -3.0426025390625, -2.908447265625, -2.7742919921875, -2.64013671875, -2.5059814453125, -2.371826171875, -2.2376708984375, -2.103515625, -1.9693603515625, -1.835205078125, -1.7010498046875, -1.56689453125, -1.4327392578125, -1.298583984375, -1.1644287109375, -1.0302734375, -0.8961181640625, -0.761962890625, -0.6278076171875, -0.49365234375, -0.3594970703125, -0.225341796875, -0.0911865234375, 0.04296875, 0.1771240234375, 0.311279296875, 0.4454345703125, 0.57958984375, 0.7137451171875, 0.847900390625, 0.9820556640625, 1.1162109375, 1.2503662109375, 1.384521484375, 1.5186767578125, 1.65283203125, 1.7869873046875, 1.921142578125, 2.0552978515625, 2.189453125, 2.3236083984375, 2.457763671875, 2.5919189453125, 2.72607421875, 2.8602294921875, 2.994384765625, 3.1285400390625, 3.2626953125, 3.3968505859375, 3.531005859375, 3.6651611328125, 3.79931640625, 3.9334716796875, 4.067626953125, 4.2017822265625, 4.3359375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 2.0, 5.0, 5.0, 2.0, 7.0, 11.0, 7.0, 12.0, 12.0, 16.0, 37.0, 80.0, 206.0, 247.0, 166.0, 63.0, 41.0, 15.0, 15.0, 10.0, 8.0, 3.0, 4.0, 2.0, 4.0, 7.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5869140625, -0.5629425048828125, -0.538970947265625, -0.5149993896484375, -0.49102783203125, -0.4670562744140625, -0.443084716796875, -0.4191131591796875, -0.3951416015625, -0.3711700439453125, -0.347198486328125, -0.3232269287109375, -0.29925537109375, -0.2752838134765625, -0.251312255859375, -0.2273406982421875, -0.203369140625, -0.1793975830078125, -0.155426025390625, -0.1314544677734375, -0.10748291015625, -0.0835113525390625, -0.059539794921875, -0.0355682373046875, -0.0115966796875, 0.0123748779296875, 0.036346435546875, 0.0603179931640625, 0.08428955078125, 0.1082611083984375, 0.132232666015625, 0.1562042236328125, 0.18017578125, 0.2041473388671875, 0.228118896484375, 0.2520904541015625, 0.27606201171875, 0.3000335693359375, 0.324005126953125, 0.3479766845703125, 0.3719482421875, 0.3959197998046875, 0.419891357421875, 0.4438629150390625, 0.46783447265625, 0.4918060302734375, 0.515777587890625, 0.5397491455078125, 0.563720703125, 0.5876922607421875, 0.611663818359375, 0.6356353759765625, 0.65960693359375, 0.6835784912109375, 0.707550048828125, 0.7315216064453125, 0.7554931640625, 0.7794647216796875, 0.803436279296875, 0.8274078369140625, 0.85137939453125, 0.8753509521484375, 0.899322509765625, 0.9232940673828125, 0.947265625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 5.0, 3.0, 7.0, 3.0, 12.0, 13.0, 17.0, 21.0, 23.0, 43.0, 68.0, 74.0, 119.0, 215.0, 344.0, 568.0, 960.0, 1985.0, 3982.0, 9384.0, 25684.0, 84290.0, 345345.0, 418083.0, 106155.0, 31093.0, 11009.0, 4542.0, 2096.0, 966.0, 540.0, 298.0, 199.0, 130.0, 81.0, 55.0, 29.0, 33.0, 22.0, 18.0, 11.0, 9.0, 6.0, 2.0, 5.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.173828125, -2.1060791015625, -2.038330078125, -1.9705810546875, -1.90283203125, -1.8350830078125, -1.767333984375, -1.6995849609375, -1.6318359375, -1.5640869140625, -1.496337890625, -1.4285888671875, -1.36083984375, -1.2930908203125, -1.225341796875, -1.1575927734375, -1.08984375, -1.0220947265625, -0.954345703125, -0.8865966796875, -0.81884765625, -0.7510986328125, -0.683349609375, -0.6156005859375, -0.5478515625, -0.4801025390625, -0.412353515625, -0.3446044921875, -0.27685546875, -0.2091064453125, -0.141357421875, -0.0736083984375, -0.005859375, 0.0618896484375, 0.129638671875, 0.1973876953125, 0.26513671875, 0.3328857421875, 0.400634765625, 0.4683837890625, 0.5361328125, 0.6038818359375, 0.671630859375, 0.7393798828125, 0.80712890625, 0.8748779296875, 0.942626953125, 1.0103759765625, 1.078125, 1.1458740234375, 1.213623046875, 1.2813720703125, 1.34912109375, 1.4168701171875, 1.484619140625, 1.5523681640625, 1.6201171875, 1.6878662109375, 1.755615234375, 1.8233642578125, 1.89111328125, 1.9588623046875, 2.026611328125, 2.0943603515625, 2.162109375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 7.0, 2.0, 5.0, 3.0, 11.0, 6.0, 5.0, 13.0, 13.0, 15.0, 15.0, 23.0, 26.0, 32.0, 35.0, 39.0, 34.0, 39.0, 45.0, 45.0, 55.0, 45.0, 46.0, 49.0, 49.0, 30.0, 40.0, 34.0, 42.0, 32.0, 30.0, 19.0, 21.0, 20.0, 15.0, 10.0, 15.0, 9.0, 8.0, 7.0, 2.0, 6.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.564453125, -2.494842529296875, -2.42523193359375, -2.355621337890625, -2.2860107421875, -2.216400146484375, -2.14678955078125, -2.077178955078125, -2.007568359375, -1.937957763671875, -1.86834716796875, -1.798736572265625, -1.7291259765625, -1.659515380859375, -1.58990478515625, -1.520294189453125, -1.45068359375, -1.381072998046875, -1.31146240234375, -1.241851806640625, -1.1722412109375, -1.102630615234375, -1.03302001953125, -0.963409423828125, -0.893798828125, -0.824188232421875, -0.75457763671875, -0.684967041015625, -0.6153564453125, -0.545745849609375, -0.47613525390625, -0.406524658203125, -0.3369140625, -0.267303466796875, -0.19769287109375, -0.128082275390625, -0.0584716796875, 0.011138916015625, 0.08074951171875, 0.150360107421875, 0.219970703125, 0.289581298828125, 0.35919189453125, 0.428802490234375, 0.4984130859375, 0.568023681640625, 0.63763427734375, 0.707244873046875, 0.77685546875, 0.846466064453125, 0.91607666015625, 0.985687255859375, 1.0552978515625, 1.124908447265625, 1.19451904296875, 1.264129638671875, 1.333740234375, 1.403350830078125, 1.47296142578125, 1.542572021484375, 1.6121826171875, 1.681793212890625, 1.75140380859375, 1.821014404296875, 1.890625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 5.0, 1.0, 6.0, 2.0, 6.0, 10.0, 11.0, 35.0, 35.0, 66.0, 113.0, 174.0, 337.0, 999.0, 6059.0, 921584.0, 114576.0, 3093.0, 749.0, 257.0, 143.0, 95.0, 56.0, 34.0, 40.0, 16.0, 13.0, 7.0, 7.0, 10.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.609375, -16.1461181640625, -15.682861328125, -15.2196044921875, -14.75634765625, -14.2930908203125, -13.829833984375, -13.3665771484375, -12.9033203125, -12.4400634765625, -11.976806640625, -11.5135498046875, -11.05029296875, -10.5870361328125, -10.123779296875, -9.6605224609375, -9.197265625, -8.7340087890625, -8.270751953125, -7.8074951171875, -7.34423828125, -6.8809814453125, -6.417724609375, -5.9544677734375, -5.4912109375, -5.0279541015625, -4.564697265625, -4.1014404296875, -3.63818359375, -3.1749267578125, -2.711669921875, -2.2484130859375, -1.78515625, -1.3218994140625, -0.858642578125, -0.3953857421875, 0.06787109375, 0.5311279296875, 0.994384765625, 1.4576416015625, 1.9208984375, 2.3841552734375, 2.847412109375, 3.3106689453125, 3.77392578125, 4.2371826171875, 4.700439453125, 5.1636962890625, 5.626953125, 6.0902099609375, 6.553466796875, 7.0167236328125, 7.47998046875, 7.9432373046875, 8.406494140625, 8.8697509765625, 9.3330078125, 9.7962646484375, 10.259521484375, 10.7227783203125, 11.18603515625, 11.6492919921875, 12.112548828125, 12.5758056640625, 13.0390625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 0.0, 4.0, 5.0, 7.0, 11.0, 33.0, 56.0, 103.0, 195.0, 249.0, 181.0, 59.0, 28.0, 20.0, 16.0, 6.0, 2.0, 3.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002853870391845703, -0.0002756677567958832, -0.00026594847440719604, -0.0002562291920185089, -0.0002465099096298218, -0.00023679062724113464, -0.0002270713448524475, -0.00021735206246376038, -0.00020763278007507324, -0.0001979134976863861, -0.00018819421529769897, -0.00017847493290901184, -0.0001687556505203247, -0.00015903636813163757, -0.00014931708574295044, -0.0001395978033542633, -0.00012987852096557617, -0.00012015923857688904, -0.0001104399561882019, -0.00010072067379951477, -9.100139141082764e-05, -8.12821090221405e-05, -7.156282663345337e-05, -6.184354424476624e-05, -5.21242618560791e-05, -4.240497946739197e-05, -3.2685697078704834e-05, -2.29664146900177e-05, -1.3247132301330566e-05, -3.5278499126434326e-06, 6.191432476043701e-06, 1.5910714864730835e-05, 2.562999725341797e-05, 3.53492796421051e-05, 4.5068562030792236e-05, 5.478784441947937e-05, 6.45071268081665e-05, 7.422640919685364e-05, 8.394569158554077e-05, 9.36649739742279e-05, 0.00010338425636291504, 0.00011310353875160217, 0.0001228228211402893, 0.00013254210352897644, 0.00014226138591766357, 0.0001519806683063507, 0.00016169995069503784, 0.00017141923308372498, 0.0001811385154724121, 0.00019085779786109924, 0.00020057708024978638, 0.0002102963626384735, 0.00022001564502716064, 0.00022973492741584778, 0.0002394542098045349, 0.00024917349219322205, 0.0002588927745819092, 0.0002686120569705963, 0.00027833133935928345, 0.0002880506217479706, 0.0002977699041366577, 0.00030748918652534485, 0.000317208468914032, 0.0003269277513027191, 0.00033664703369140625]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 3.0, 7.0, 8.0, 4.0, 14.0, 22.0, 29.0, 32.0, 67.0, 102.0, 166.0, 304.0, 490.0, 988.0, 2369.0, 9338.0, 88634.0, 862506.0, 70979.0, 8297.0, 2200.0, 904.0, 437.0, 245.0, 150.0, 102.0, 52.0, 31.0, 18.0, 14.0, 9.0, 5.0, 7.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.84765625, -4.69830322265625, -4.5489501953125, -4.39959716796875, -4.250244140625, -4.10089111328125, -3.9515380859375, -3.80218505859375, -3.65283203125, -3.50347900390625, -3.3541259765625, -3.20477294921875, -3.055419921875, -2.90606689453125, -2.7567138671875, -2.60736083984375, -2.4580078125, -2.30865478515625, -2.1593017578125, -2.00994873046875, -1.860595703125, -1.71124267578125, -1.5618896484375, -1.41253662109375, -1.26318359375, -1.11383056640625, -0.9644775390625, -0.81512451171875, -0.665771484375, -0.51641845703125, -0.3670654296875, -0.21771240234375, -0.068359375, 0.08099365234375, 0.2303466796875, 0.37969970703125, 0.529052734375, 0.67840576171875, 0.8277587890625, 0.97711181640625, 1.12646484375, 1.27581787109375, 1.4251708984375, 1.57452392578125, 1.723876953125, 1.87322998046875, 2.0225830078125, 2.17193603515625, 2.3212890625, 2.47064208984375, 2.6199951171875, 2.76934814453125, 2.918701171875, 3.06805419921875, 3.2174072265625, 3.36676025390625, 3.51611328125, 3.66546630859375, 3.8148193359375, 3.96417236328125, 4.113525390625, 4.26287841796875, 4.4122314453125, 4.56158447265625, 4.7109375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 10.0, 10.0, 16.0, 33.0, 66.0, 125.0, 207.0, 234.0, 128.0, 77.0, 48.0, 17.0, 6.0, 8.0, 4.0, 7.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.85546875, -5.68328857421875, -5.5111083984375, -5.33892822265625, -5.166748046875, -4.99456787109375, -4.8223876953125, -4.65020751953125, -4.47802734375, -4.30584716796875, -4.1336669921875, -3.96148681640625, -3.789306640625, -3.61712646484375, -3.4449462890625, -3.27276611328125, -3.1005859375, -2.92840576171875, -2.7562255859375, -2.58404541015625, -2.411865234375, -2.23968505859375, -2.0675048828125, -1.89532470703125, -1.72314453125, -1.55096435546875, -1.3787841796875, -1.20660400390625, -1.034423828125, -0.86224365234375, -0.6900634765625, -0.51788330078125, -0.345703125, -0.17352294921875, -0.0013427734375, 0.17083740234375, 0.343017578125, 0.51519775390625, 0.6873779296875, 0.85955810546875, 1.03173828125, 1.20391845703125, 1.3760986328125, 1.54827880859375, 1.720458984375, 1.89263916015625, 2.0648193359375, 2.23699951171875, 2.4091796875, 2.58135986328125, 2.7535400390625, 2.92572021484375, 3.097900390625, 3.27008056640625, 3.4422607421875, 3.61444091796875, 3.78662109375, 3.95880126953125, 4.1309814453125, 4.30316162109375, 4.475341796875, 4.64752197265625, 4.8197021484375, 4.99188232421875, 5.1640625]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 13.0, 31.0, 85.0, 269.0, 377.0, 126.0, 57.0, 18.0, 2.0, 4.0, 4.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.457561492919922, -21.293838500976562, -20.130117416381836, -18.96639633178711, -17.80267333984375, -16.63895034790039, -15.475229263305664, -14.311507225036621, -13.147785186767578, -11.984063148498535, -10.820341110229492, -9.65661907196045, -8.492897033691406, -7.329174995422363, -6.16545295715332, -5.001730918884277, -3.8380088806152344, -2.6742868423461914, -1.5105648040771484, -0.34684276580810547, 0.8168792724609375, 1.9806013107299805, 3.1443233489990234, 4.308045387268066, 5.471767425537109, 6.635489463806152, 7.799211502075195, 8.962933540344238, 10.126655578613281, 11.290377616882324, 12.454099655151367, 13.61782169342041, 14.781547546386719, 15.945269584655762, 17.108991622924805, 18.27271270751953, 19.43643569946289, 20.60015869140625, 21.763879776000977, 22.927600860595703, 24.091323852539062, 25.255046844482422, 26.41876792907715, 27.582489013671875, 28.746212005615234, 29.909934997558594, 31.07365608215332, 32.23737716674805, 33.401100158691406, 34.564823150634766, 35.728546142578125, 36.89226531982422, 38.05598831176758, 39.21971130371094, 40.38343048095703, 41.54715347290039, 42.71087646484375, 43.87459945678711, 45.03832244873047, 46.20204162597656, 47.36576461791992, 48.52948760986328, 49.693206787109375, 50.856929779052734, 52.020652770996094]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 6.0, 3.0, 4.0, 8.0, 11.0, 18.0, 28.0, 46.0, 68.0, 63.0, 64.0, 90.0, 95.0, 95.0, 91.0, 63.0, 57.0, 52.0, 44.0, 19.0, 16.0, 16.0, 7.0, 3.0, 4.0, 2.0, 4.0, 5.0, 2.0, 5.0, 3.0, 0.0, 5.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.911659240722656, -31.992645263671875, -31.07362937927246, -30.154613494873047, -29.235599517822266, -28.316585540771484, -27.39756965637207, -26.478553771972656, -25.559539794921875, -24.640525817871094, -23.72150993347168, -22.802494049072266, -21.883480072021484, -20.964466094970703, -20.04545021057129, -19.126434326171875, -18.207420349121094, -17.288406372070312, -16.3693904876709, -15.4503755569458, -14.531360626220703, -13.612345695495605, -12.693330764770508, -11.77431583404541, -10.855300903320312, -9.936285972595215, -9.017271041870117, -8.09825611114502, -7.179241180419922, -6.260226249694824, -5.341211318969727, -4.422196388244629, -3.5031814575195312, -2.5841665267944336, -1.665151596069336, -0.7461366653442383, 0.17287826538085938, 1.091893196105957, 2.0109081268310547, 2.9299230575561523, 3.84893798828125, 4.767952919006348, 5.686967849731445, 6.605982780456543, 7.524997711181641, 8.444012641906738, 9.363027572631836, 10.282042503356934, 11.201057434082031, 12.120072364807129, 13.039087295532227, 13.958102226257324, 14.877117156982422, 15.79613208770752, 16.715147018432617, 17.63416290283203, 18.553176879882812, 19.472190856933594, 20.391206741333008, 21.310222625732422, 22.229236602783203, 23.148250579833984, 24.0672664642334, 24.986282348632812, 25.905296325683594]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 7.0, 7.0, 9.0, 13.0, 34.0, 26.0, 47.0, 59.0, 100.0, 115.0, 194.0, 307.0, 406.0, 721.0, 1210.0, 2524.0, 6735.0, 32271.0, 3906494.0, 218218.0, 15427.0, 4222.0, 1917.0, 1105.0, 646.0, 419.0, 264.0, 210.0, 126.0, 92.0, 90.0, 64.0, 34.0, 26.0, 30.0, 27.0, 18.0, 10.0, 10.0, 16.0, 7.0, 4.0, 8.0, 2.0, 3.0, 6.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.1640625, -8.7789306640625, -8.393798828125, -8.0086669921875, -7.62353515625, -7.2384033203125, -6.853271484375, -6.4681396484375, -6.0830078125, -5.6978759765625, -5.312744140625, -4.9276123046875, -4.54248046875, -4.1573486328125, -3.772216796875, -3.3870849609375, -3.001953125, -2.6168212890625, -2.231689453125, -1.8465576171875, -1.46142578125, -1.0762939453125, -0.691162109375, -0.3060302734375, 0.0791015625, 0.4642333984375, 0.849365234375, 1.2344970703125, 1.61962890625, 2.0047607421875, 2.389892578125, 2.7750244140625, 3.16015625, 3.5452880859375, 3.930419921875, 4.3155517578125, 4.70068359375, 5.0858154296875, 5.470947265625, 5.8560791015625, 6.2412109375, 6.6263427734375, 7.011474609375, 7.3966064453125, 7.78173828125, 8.1668701171875, 8.552001953125, 8.9371337890625, 9.322265625, 9.7073974609375, 10.092529296875, 10.4776611328125, 10.86279296875, 11.2479248046875, 11.633056640625, 12.0181884765625, 12.4033203125, 12.7884521484375, 13.173583984375, 13.5587158203125, 13.94384765625, 14.3289794921875, 14.714111328125, 15.0992431640625, 15.484375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 7.0, 4.0, 2.0, 11.0, 14.0, 20.0, 24.0, 52.0, 105.0, 172.0, 226.0, 156.0, 86.0, 48.0, 20.0, 7.0, 7.0, 9.0, 7.0, 6.0, 2.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.63818359375, -0.6108932495117188, -0.5836029052734375, -0.5563125610351562, -0.529022216796875, -0.5017318725585938, -0.4744415283203125, -0.44715118408203125, -0.41986083984375, -0.39257049560546875, -0.3652801513671875, -0.33798980712890625, -0.310699462890625, -0.28340911865234375, -0.2561187744140625, -0.22882843017578125, -0.2015380859375, -0.17424774169921875, -0.1469573974609375, -0.11966705322265625, -0.092376708984375, -0.06508636474609375, -0.0377960205078125, -0.01050567626953125, 0.01678466796875, 0.04407501220703125, 0.0713653564453125, 0.09865570068359375, 0.125946044921875, 0.15323638916015625, 0.1805267333984375, 0.20781707763671875, 0.235107421875, 0.26239776611328125, 0.2896881103515625, 0.31697845458984375, 0.344268798828125, 0.37155914306640625, 0.3988494873046875, 0.42613983154296875, 0.45343017578125, 0.48072052001953125, 0.5080108642578125, 0.5353012084960938, 0.562591552734375, 0.5898818969726562, 0.6171722412109375, 0.6444625854492188, 0.6717529296875, 0.6990432739257812, 0.7263336181640625, 0.7536239624023438, 0.780914306640625, 0.8082046508789062, 0.8354949951171875, 0.8627853393554688, 0.89007568359375, 0.9173660278320312, 0.9446563720703125, 0.9719467163085938, 0.999237060546875, 1.0265274047851562, 1.0538177490234375, 1.0811080932617188, 1.1083984375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 2.0, 7.0, 6.0, 4.0, 10.0, 13.0, 14.0, 26.0, 26.0, 86.0, 148.0, 444.0, 2193.0, 30290.0, 4101661.0, 55612.0, 2916.0, 489.0, 141.0, 62.0, 44.0, 28.0, 13.0, 11.0, 11.0, 4.0, 2.0, 5.0, 2.0, 2.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.28125, -12.860595703125, -12.43994140625, -12.019287109375, -11.5986328125, -11.177978515625, -10.75732421875, -10.336669921875, -9.916015625, -9.495361328125, -9.07470703125, -8.654052734375, -8.2333984375, -7.812744140625, -7.39208984375, -6.971435546875, -6.55078125, -6.130126953125, -5.70947265625, -5.288818359375, -4.8681640625, -4.447509765625, -4.02685546875, -3.606201171875, -3.185546875, -2.764892578125, -2.34423828125, -1.923583984375, -1.5029296875, -1.082275390625, -0.66162109375, -0.240966796875, 0.1796875, 0.600341796875, 1.02099609375, 1.441650390625, 1.8623046875, 2.282958984375, 2.70361328125, 3.124267578125, 3.544921875, 3.965576171875, 4.38623046875, 4.806884765625, 5.2275390625, 5.648193359375, 6.06884765625, 6.489501953125, 6.91015625, 7.330810546875, 7.75146484375, 8.172119140625, 8.5927734375, 9.013427734375, 9.43408203125, 9.854736328125, 10.275390625, 10.696044921875, 11.11669921875, 11.537353515625, 11.9580078125, 12.378662109375, 12.79931640625, 13.219970703125, 13.640625]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 0.0, 5.0, 4.0, 3.0, 7.0, 6.0, 11.0, 11.0, 22.0, 28.0, 55.0, 53.0, 128.0, 276.0, 672.0, 1596.0, 556.0, 244.0, 164.0, 69.0, 47.0, 33.0, 22.0, 16.0, 18.0, 5.0, 5.0, 4.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1103515625, -1.0780487060546875, -1.045745849609375, -1.0134429931640625, -0.98114013671875, -0.9488372802734375, -0.916534423828125, -0.8842315673828125, -0.8519287109375, -0.8196258544921875, -0.787322998046875, -0.7550201416015625, -0.72271728515625, -0.6904144287109375, -0.658111572265625, -0.6258087158203125, -0.593505859375, -0.5612030029296875, -0.528900146484375, -0.4965972900390625, -0.46429443359375, -0.4319915771484375, -0.399688720703125, -0.3673858642578125, -0.3350830078125, -0.3027801513671875, -0.270477294921875, -0.2381744384765625, -0.20587158203125, -0.1735687255859375, -0.141265869140625, -0.1089630126953125, -0.07666015625, -0.0443572998046875, -0.012054443359375, 0.0202484130859375, 0.05255126953125, 0.0848541259765625, 0.117156982421875, 0.1494598388671875, 0.1817626953125, 0.2140655517578125, 0.246368408203125, 0.2786712646484375, 0.31097412109375, 0.3432769775390625, 0.375579833984375, 0.4078826904296875, 0.440185546875, 0.4724884033203125, 0.504791259765625, 0.5370941162109375, 0.56939697265625, 0.6016998291015625, 0.634002685546875, 0.6663055419921875, 0.6986083984375, 0.7309112548828125, 0.763214111328125, 0.7955169677734375, 0.82781982421875, 0.8601226806640625, 0.892425537109375, 0.9247283935546875, 0.95703125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 11.0, 30.0, 81.0, 231.0, 317.0, 210.0, 68.0, 28.0, 11.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.44077730178833, -7.2099175453186035, -6.979057788848877, -6.748197555541992, -6.517337799072266, -6.286478042602539, -6.0556182861328125, -5.824758529663086, -5.593898773193359, -5.363039016723633, -5.132179260253906, -4.90131950378418, -4.670459270477295, -4.439599514007568, -4.208739757537842, -3.9778800010681152, -3.7470197677612305, -3.516160011291504, -3.2853000164031982, -3.0544402599334717, -2.823580265045166, -2.5927205085754395, -2.361860752105713, -2.1310009956359863, -1.9001410007476807, -1.6692811250686646, -1.4384212493896484, -1.2075614929199219, -0.9767016172409058, -0.7458417415618896, -0.5149819850921631, -0.284122109413147, -0.053261756896972656, 0.17759808897972107, 0.4084579348564148, 0.6393177509307861, 0.8701776266098022, 1.1010375022888184, 1.331897258758545, 1.562757134437561, 1.7936170101165771, 2.0244767665863037, 2.2553367614746094, 2.486196517944336, 2.7170562744140625, 2.947916269302368, 3.1787760257720947, 3.4096360206604004, 3.640495777130127, 3.8713555335998535, 4.10221529006958, 4.333075523376465, 4.563935279846191, 4.794795036315918, 5.0256547927856445, 5.256514549255371, 5.487374305725098, 5.718234062194824, 5.949093818664551, 6.179953575134277, 6.410813808441162, 6.641673564910889, 6.872533321380615, 7.103393077850342, 7.334253311157227]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 7.0, 3.0, 8.0, 8.0, 10.0, 15.0, 18.0, 27.0, 32.0, 32.0, 49.0, 51.0, 63.0, 53.0, 72.0, 72.0, 53.0, 55.0, 52.0, 46.0, 45.0, 42.0, 32.0, 30.0, 27.0, 14.0, 15.0, 11.0, 8.0, 14.0, 3.0, 3.0, 5.0, 5.0, 7.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.883978843688965, -4.759563446044922, -4.635148048400879, -4.510732650756836, -4.386317253112793, -4.26190185546875, -4.137486457824707, -4.013071060180664, -3.888655662536621, -3.764240264892578, -3.639824867248535, -3.515409469604492, -3.390994071960449, -3.2665786743164062, -3.1421632766723633, -3.0177478790283203, -2.8933324813842773, -2.7689170837402344, -2.6445016860961914, -2.5200862884521484, -2.3956708908081055, -2.2712554931640625, -2.1468400955200195, -2.0224246978759766, -1.8980093002319336, -1.7735939025878906, -1.6491785049438477, -1.5247631072998047, -1.4003477096557617, -1.2759323120117188, -1.1515169143676758, -1.0271015167236328, -0.9026861190795898, -0.7782707214355469, -0.6538553237915039, -0.5294399261474609, -0.40502452850341797, -0.280609130859375, -0.15619373321533203, -0.03177833557128906, 0.0926370620727539, 0.21705245971679688, 0.34146785736083984, 0.4658832550048828, 0.5902986526489258, 0.7147140502929688, 0.8391294479370117, 0.9635448455810547, 1.0879602432250977, 1.2123756408691406, 1.3367910385131836, 1.4612064361572266, 1.5856218338012695, 1.7100372314453125, 1.8344526290893555, 1.9588680267333984, 2.0832834243774414, 2.2076988220214844, 2.3321142196655273, 2.4565296173095703, 2.5809450149536133, 2.7053604125976562, 2.829775810241699, 2.954191207885742, 3.078606605529785]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 6.0, 11.0, 13.0, 13.0, 14.0, 54.0, 37.0, 96.0, 169.0, 253.0, 473.0, 951.0, 2320.0, 8000.0, 74725.0, 887709.0, 62222.0, 7349.0, 2130.0, 877.0, 468.0, 225.0, 166.0, 83.0, 46.0, 43.0, 27.0, 31.0, 11.0, 3.0, 11.0, 4.0, 1.0, 6.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.54296875, -7.32415771484375, -7.1053466796875, -6.88653564453125, -6.667724609375, -6.44891357421875, -6.2301025390625, -6.01129150390625, -5.79248046875, -5.57366943359375, -5.3548583984375, -5.13604736328125, -4.917236328125, -4.69842529296875, -4.4796142578125, -4.26080322265625, -4.0419921875, -3.82318115234375, -3.6043701171875, -3.38555908203125, -3.166748046875, -2.94793701171875, -2.7291259765625, -2.51031494140625, -2.29150390625, -2.07269287109375, -1.8538818359375, -1.63507080078125, -1.416259765625, -1.19744873046875, -0.9786376953125, -0.75982666015625, -0.541015625, -0.32220458984375, -0.1033935546875, 0.11541748046875, 0.334228515625, 0.55303955078125, 0.7718505859375, 0.99066162109375, 1.20947265625, 1.42828369140625, 1.6470947265625, 1.86590576171875, 2.084716796875, 2.30352783203125, 2.5223388671875, 2.74114990234375, 2.9599609375, 3.17877197265625, 3.3975830078125, 3.61639404296875, 3.835205078125, 4.05401611328125, 4.2728271484375, 4.49163818359375, 4.71044921875, 4.92926025390625, 5.1480712890625, 5.36688232421875, 5.585693359375, 5.80450439453125, 6.0233154296875, 6.24212646484375, 6.4609375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 8.0, 3.0, 12.0, 9.0, 24.0, 55.0, 105.0, 148.0, 217.0, 162.0, 113.0, 69.0, 32.0, 11.0, 8.0, 7.0, 0.0, 4.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59716796875, -0.5708541870117188, -0.5445404052734375, -0.5182266235351562, -0.491912841796875, -0.46559906005859375, -0.4392852783203125, -0.41297149658203125, -0.38665771484375, -0.36034393310546875, -0.3340301513671875, -0.30771636962890625, -0.281402587890625, -0.25508880615234375, -0.2287750244140625, -0.20246124267578125, -0.1761474609375, -0.14983367919921875, -0.1235198974609375, -0.09720611572265625, -0.070892333984375, -0.04457855224609375, -0.0182647705078125, 0.00804901123046875, 0.03436279296875, 0.06067657470703125, 0.0869903564453125, 0.11330413818359375, 0.139617919921875, 0.16593170166015625, 0.1922454833984375, 0.21855926513671875, 0.244873046875, 0.27118682861328125, 0.2975006103515625, 0.32381439208984375, 0.350128173828125, 0.37644195556640625, 0.4027557373046875, 0.42906951904296875, 0.45538330078125, 0.48169708251953125, 0.5080108642578125, 0.5343246459960938, 0.560638427734375, 0.5869522094726562, 0.6132659912109375, 0.6395797729492188, 0.6658935546875, 0.6922073364257812, 0.7185211181640625, 0.7448348999023438, 0.771148681640625, 0.7974624633789062, 0.8237762451171875, 0.8500900268554688, 0.87640380859375, 0.9027175903320312, 0.9290313720703125, 0.9553451538085938, 0.981658935546875, 1.0079727172851562, 1.0342864990234375, 1.0606002807617188, 1.0869140625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 9.0, 9.0, 18.0, 22.0, 16.0, 35.0, 29.0, 46.0, 51.0, 74.0, 107.0, 115.0, 160.0, 265.0, 344.0, 586.0, 1062.0, 1979.0, 4663.0, 11664.0, 32385.0, 108016.0, 391198.0, 352103.0, 94105.0, 29338.0, 10543.0, 4528.0, 2100.0, 1086.0, 560.0, 361.0, 243.0, 177.0, 131.0, 79.0, 73.0, 56.0, 37.0, 39.0, 28.0, 23.0, 17.0, 12.0, 8.0, 13.0, 8.0, 11.0, 7.0, 10.0, 3.0, 3.0, 3.0], "bins": [-2.73828125, -2.657623291015625, -2.57696533203125, -2.496307373046875, -2.4156494140625, -2.334991455078125, -2.25433349609375, -2.173675537109375, -2.093017578125, -2.012359619140625, -1.93170166015625, -1.851043701171875, -1.7703857421875, -1.689727783203125, -1.60906982421875, -1.528411865234375, -1.44775390625, -1.367095947265625, -1.28643798828125, -1.205780029296875, -1.1251220703125, -1.044464111328125, -0.96380615234375, -0.883148193359375, -0.802490234375, -0.721832275390625, -0.64117431640625, -0.560516357421875, -0.4798583984375, -0.399200439453125, -0.31854248046875, -0.237884521484375, -0.1572265625, -0.076568603515625, 0.00408935546875, 0.084747314453125, 0.1654052734375, 0.246063232421875, 0.32672119140625, 0.407379150390625, 0.488037109375, 0.568695068359375, 0.64935302734375, 0.730010986328125, 0.8106689453125, 0.891326904296875, 0.97198486328125, 1.052642822265625, 1.13330078125, 1.213958740234375, 1.29461669921875, 1.375274658203125, 1.4559326171875, 1.536590576171875, 1.61724853515625, 1.697906494140625, 1.778564453125, 1.859222412109375, 1.93988037109375, 2.020538330078125, 2.1011962890625, 2.181854248046875, 2.26251220703125, 2.343170166015625, 2.423828125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 0.0, 4.0, 3.0, 9.0, 11.0, 6.0, 6.0, 15.0, 15.0, 20.0, 23.0, 24.0, 22.0, 35.0, 36.0, 31.0, 37.0, 38.0, 44.0, 46.0, 42.0, 43.0, 47.0, 55.0, 34.0, 35.0, 41.0, 37.0, 35.0, 25.0, 23.0, 24.0, 21.0, 17.0, 18.0, 15.0, 14.0, 7.0, 14.0, 5.0, 2.0, 7.0, 2.0, 1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 0.0, 2.0], "bins": [-2.41796875, -2.3460693359375, -2.274169921875, -2.2022705078125, -2.13037109375, -2.0584716796875, -1.986572265625, -1.9146728515625, -1.8427734375, -1.7708740234375, -1.698974609375, -1.6270751953125, -1.55517578125, -1.4832763671875, -1.411376953125, -1.3394775390625, -1.267578125, -1.1956787109375, -1.123779296875, -1.0518798828125, -0.97998046875, -0.9080810546875, -0.836181640625, -0.7642822265625, -0.6923828125, -0.6204833984375, -0.548583984375, -0.4766845703125, -0.40478515625, -0.3328857421875, -0.260986328125, -0.1890869140625, -0.1171875, -0.0452880859375, 0.026611328125, 0.0985107421875, 0.17041015625, 0.2423095703125, 0.314208984375, 0.3861083984375, 0.4580078125, 0.5299072265625, 0.601806640625, 0.6737060546875, 0.74560546875, 0.8175048828125, 0.889404296875, 0.9613037109375, 1.033203125, 1.1051025390625, 1.177001953125, 1.2489013671875, 1.32080078125, 1.3927001953125, 1.464599609375, 1.5364990234375, 1.6083984375, 1.6802978515625, 1.752197265625, 1.8240966796875, 1.89599609375, 1.9678955078125, 2.039794921875, 2.1116943359375, 2.18359375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 9.0, 17.0, 7.0, 12.0, 17.0, 25.0, 51.0, 108.0, 154.0, 258.0, 687.0, 1762.0, 6811.0, 42689.0, 514503.0, 436070.0, 36304.0, 6151.0, 1624.0, 629.0, 297.0, 136.0, 76.0, 56.0, 42.0, 25.0, 13.0, 12.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.533203125, -2.453948974609375, -2.37469482421875, -2.295440673828125, -2.2161865234375, -2.136932373046875, -2.05767822265625, -1.978424072265625, -1.899169921875, -1.819915771484375, -1.74066162109375, -1.661407470703125, -1.5821533203125, -1.502899169921875, -1.42364501953125, -1.344390869140625, -1.26513671875, -1.185882568359375, -1.10662841796875, -1.027374267578125, -0.9481201171875, -0.868865966796875, -0.78961181640625, -0.710357666015625, -0.631103515625, -0.551849365234375, -0.47259521484375, -0.393341064453125, -0.3140869140625, -0.234832763671875, -0.15557861328125, -0.076324462890625, 0.0029296875, 0.082183837890625, 0.16143798828125, 0.240692138671875, 0.3199462890625, 0.399200439453125, 0.47845458984375, 0.557708740234375, 0.636962890625, 0.716217041015625, 0.79547119140625, 0.874725341796875, 0.9539794921875, 1.033233642578125, 1.11248779296875, 1.191741943359375, 1.27099609375, 1.350250244140625, 1.42950439453125, 1.508758544921875, 1.5880126953125, 1.667266845703125, 1.74652099609375, 1.825775146484375, 1.905029296875, 1.984283447265625, 2.06353759765625, 2.142791748046875, 2.2220458984375, 2.301300048828125, 2.38055419921875, 2.459808349609375, 2.5390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 3.0, 10.0, 10.0, 11.0, 14.0, 21.0, 15.0, 17.0, 28.0, 37.0, 43.0, 64.0, 73.0, 86.0, 96.0, 85.0, 60.0, 60.0, 54.0, 37.0, 34.0, 28.0, 19.0, 11.0, 15.0, 10.0, 9.0, 11.0, 3.0, 4.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00015234947204589844, -0.00014765188097953796, -0.0001429542899131775, -0.00013825669884681702, -0.00013355910778045654, -0.00012886151671409607, -0.0001241639256477356, -0.00011946633458137512, -0.00011476874351501465, -0.00011007115244865417, -0.0001053735613822937, -0.00010067597031593323, -9.597837924957275e-05, -9.128078818321228e-05, -8.65831971168518e-05, -8.188560605049133e-05, -7.718801498413086e-05, -7.249042391777039e-05, -6.779283285140991e-05, -6.309524178504944e-05, -5.8397650718688965e-05, -5.370005965232849e-05, -4.900246858596802e-05, -4.4304877519607544e-05, -3.960728645324707e-05, -3.49096953868866e-05, -3.0212104320526123e-05, -2.551451325416565e-05, -2.0816922187805176e-05, -1.6119331121444702e-05, -1.1421740055084229e-05, -6.724148988723755e-06, -2.0265579223632812e-06, 2.6710331439971924e-06, 7.368624210357666e-06, 1.206621527671814e-05, 1.6763806343078613e-05, 2.1461397409439087e-05, 2.615898847579956e-05, 3.0856579542160034e-05, 3.555417060852051e-05, 4.025176167488098e-05, 4.4949352741241455e-05, 4.964694380760193e-05, 5.43445348739624e-05, 5.9042125940322876e-05, 6.373971700668335e-05, 6.843730807304382e-05, 7.31348991394043e-05, 7.783249020576477e-05, 8.253008127212524e-05, 8.722767233848572e-05, 9.192526340484619e-05, 9.662285447120667e-05, 0.00010132044553756714, 0.00010601803660392761, 0.00011071562767028809, 0.00011541321873664856, 0.00012011080980300903, 0.0001248084008693695, 0.00012950599193572998, 0.00013420358300209045, 0.00013890117406845093, 0.0001435987651348114, 0.00014829635620117188]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 3.0, 10.0, 14.0, 6.0, 16.0, 17.0, 31.0, 35.0, 63.0, 72.0, 136.0, 240.0, 372.0, 706.0, 1615.0, 4038.0, 12488.0, 48017.0, 248672.0, 574760.0, 118016.0, 26556.0, 7526.0, 2610.0, 1076.0, 596.0, 299.0, 192.0, 126.0, 83.0, 40.0, 32.0, 22.0, 12.0, 14.0, 13.0, 9.0, 6.0, 7.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.783203125, -1.7279815673828125, -1.672760009765625, -1.6175384521484375, -1.56231689453125, -1.5070953369140625, -1.451873779296875, -1.3966522216796875, -1.3414306640625, -1.2862091064453125, -1.230987548828125, -1.1757659912109375, -1.12054443359375, -1.0653228759765625, -1.010101318359375, -0.9548797607421875, -0.899658203125, -0.8444366455078125, -0.789215087890625, -0.7339935302734375, -0.67877197265625, -0.6235504150390625, -0.568328857421875, -0.5131072998046875, -0.4578857421875, -0.4026641845703125, -0.347442626953125, -0.2922210693359375, -0.23699951171875, -0.1817779541015625, -0.126556396484375, -0.0713348388671875, -0.01611328125, 0.0391082763671875, 0.094329833984375, 0.1495513916015625, 0.20477294921875, 0.2599945068359375, 0.315216064453125, 0.3704376220703125, 0.4256591796875, 0.4808807373046875, 0.536102294921875, 0.5913238525390625, 0.64654541015625, 0.7017669677734375, 0.756988525390625, 0.8122100830078125, 0.867431640625, 0.9226531982421875, 0.977874755859375, 1.0330963134765625, 1.08831787109375, 1.1435394287109375, 1.198760986328125, 1.2539825439453125, 1.3092041015625, 1.3644256591796875, 1.419647216796875, 1.4748687744140625, 1.53009033203125, 1.5853118896484375, 1.640533447265625, 1.6957550048828125, 1.7509765625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 2.0, 7.0, 9.0, 7.0, 12.0, 18.0, 25.0, 14.0, 22.0, 42.0, 34.0, 40.0, 55.0, 73.0, 81.0, 81.0, 73.0, 66.0, 56.0, 43.0, 50.0, 39.0, 26.0, 16.0, 17.0, 16.0, 10.0, 15.0, 9.0, 7.0, 5.0, 4.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.12890625, -1.0963516235351562, -1.0637969970703125, -1.0312423706054688, -0.998687744140625, -0.9661331176757812, -0.9335784912109375, -0.9010238647460938, -0.86846923828125, -0.8359146118164062, -0.8033599853515625, -0.7708053588867188, -0.738250732421875, -0.7056961059570312, -0.6731414794921875, -0.6405868530273438, -0.6080322265625, -0.5754776000976562, -0.5429229736328125, -0.5103683471679688, -0.477813720703125, -0.44525909423828125, -0.4127044677734375, -0.38014984130859375, -0.34759521484375, -0.31504058837890625, -0.2824859619140625, -0.24993133544921875, -0.217376708984375, -0.18482208251953125, -0.1522674560546875, -0.11971282958984375, -0.087158203125, -0.05460357666015625, -0.0220489501953125, 0.01050567626953125, 0.043060302734375, 0.07561492919921875, 0.1081695556640625, 0.14072418212890625, 0.17327880859375, 0.20583343505859375, 0.2383880615234375, 0.27094268798828125, 0.303497314453125, 0.33605194091796875, 0.3686065673828125, 0.40116119384765625, 0.4337158203125, 0.46627044677734375, 0.4988250732421875, 0.5313796997070312, 0.563934326171875, 0.5964889526367188, 0.6290435791015625, 0.6615982055664062, 0.69415283203125, 0.7267074584960938, 0.7592620849609375, 0.7918167114257812, 0.824371337890625, 0.8569259643554688, 0.8894805908203125, 0.9220352172851562, 0.95458984375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 7.0, 11.0, 13.0, 15.0, 39.0, 66.0, 152.0, 243.0, 220.0, 105.0, 59.0, 30.0, 20.0, 8.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.741256713867188, -19.963449478149414, -19.185644149780273, -18.4078369140625, -17.63003158569336, -16.852224349975586, -16.074417114257812, -15.296610832214355, -14.518804550170898, -13.740998268127441, -12.963191986083984, -12.185384750366211, -11.407578468322754, -10.629772186279297, -9.851964950561523, -9.074158668518066, -8.29635238647461, -7.518546104431152, -6.740739345550537, -5.962932586669922, -5.185126304626465, -4.407320022583008, -3.6295132637023926, -2.8517065048217773, -2.0739002227783203, -1.2960937023162842, -0.518287181854248, 0.2595193386077881, 1.0373258590698242, 1.8151323795318604, 2.5929388999938965, 3.3707456588745117, 4.148550033569336, 4.926356315612793, 5.704163074493408, 6.481969833374023, 7.2597761154174805, 8.037582397460938, 8.815389633178711, 9.593195915222168, 10.371002197265625, 11.148808479309082, 11.926614761352539, 12.704421997070312, 13.48222827911377, 14.260034561157227, 15.037841796875, 15.815648078918457, 16.593454360961914, 17.371261596679688, 18.149066925048828, 18.9268741607666, 19.704681396484375, 20.482486724853516, 21.26029396057129, 22.038101196289062, 22.815906524658203, 23.593713760375977, 24.371519088745117, 25.14932632446289, 25.92713165283203, 26.704938888549805, 27.482746124267578, 28.26055145263672, 29.038358688354492]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 4.0, 11.0, 10.0, 10.0, 15.0, 22.0, 33.0, 31.0, 41.0, 49.0, 53.0, 56.0, 69.0, 69.0, 64.0, 64.0, 67.0, 52.0, 42.0, 46.0, 43.0, 37.0, 25.0, 23.0, 20.0, 12.0, 11.0, 10.0, 6.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.89222526550293, -20.089824676513672, -19.287424087524414, -18.485023498535156, -17.682621002197266, -16.880220413208008, -16.07781982421875, -15.275419235229492, -14.473017692565918, -13.67061710357666, -12.868215560913086, -12.065814971923828, -11.26341438293457, -10.461012840270996, -9.658612251281738, -8.856210708618164, -8.053810119628906, -7.25140905380249, -6.449007987976074, -5.646607398986816, -4.8442063331604, -4.041805267333984, -3.2394046783447266, -2.4370036125183105, -1.6346025466918945, -0.8322016000747681, -0.0298006534576416, 0.7726001739501953, 1.5750012397766113, 2.3774023056030273, 3.179802894592285, 3.982203960418701, 4.78460693359375, 5.587007999420166, 6.389409065246582, 7.19180965423584, 7.994210720062256, 8.796611785888672, 9.59901237487793, 10.401412963867188, 11.203814506530762, 12.00621509552002, 12.808616638183594, 13.611017227172852, 14.41341781616211, 15.215819358825684, 16.018218994140625, 16.820621490478516, 17.623022079467773, 18.42542266845703, 19.22782325744629, 20.030223846435547, 20.832626342773438, 21.635026931762695, 22.437427520751953, 23.23982810974121, 24.04222869873047, 24.844629287719727, 25.647029876708984, 26.449432373046875, 27.251832962036133, 28.05423355102539, 28.85663414001465, 29.659034729003906, 30.461437225341797]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 5.0, 7.0, 12.0, 27.0, 26.0, 72.0, 210.0, 756.0, 7946.0, 4166263.0, 16832.0, 1372.0, 392.0, 181.0, 75.0, 37.0, 25.0, 16.0, 8.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.71875, -23.712890625, -22.70703125, -21.701171875, -20.6953125, -19.689453125, -18.68359375, -17.677734375, -16.671875, -15.666015625, -14.66015625, -13.654296875, -12.6484375, -11.642578125, -10.63671875, -9.630859375, -8.625, -7.619140625, -6.61328125, -5.607421875, -4.6015625, -3.595703125, -2.58984375, -1.583984375, -0.578125, 0.427734375, 1.43359375, 2.439453125, 3.4453125, 4.451171875, 5.45703125, 6.462890625, 7.46875, 8.474609375, 9.48046875, 10.486328125, 11.4921875, 12.498046875, 13.50390625, 14.509765625, 15.515625, 16.521484375, 17.52734375, 18.533203125, 19.5390625, 20.544921875, 21.55078125, 22.556640625, 23.5625, 24.568359375, 25.57421875, 26.580078125, 27.5859375, 28.591796875, 29.59765625, 30.603515625, 31.609375, 32.615234375, 33.62109375, 34.626953125, 35.6328125, 36.638671875, 37.64453125, 38.650390625, 39.65625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 10.0, 9.0, 17.0, 12.0, 23.0, 43.0, 89.0, 119.0, 146.0, 142.0, 136.0, 85.0, 57.0, 44.0, 23.0, 15.0, 8.0, 10.0, 0.0, 4.0, 1.0, 2.0, 3.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.775390625, -0.7436065673828125, -0.711822509765625, -0.6800384521484375, -0.64825439453125, -0.6164703369140625, -0.584686279296875, -0.5529022216796875, -0.5211181640625, -0.4893341064453125, -0.457550048828125, -0.4257659912109375, -0.39398193359375, -0.3621978759765625, -0.330413818359375, -0.2986297607421875, -0.266845703125, -0.2350616455078125, -0.203277587890625, -0.1714935302734375, -0.13970947265625, -0.1079254150390625, -0.076141357421875, -0.0443572998046875, -0.0125732421875, 0.0192108154296875, 0.050994873046875, 0.0827789306640625, 0.11456298828125, 0.1463470458984375, 0.178131103515625, 0.2099151611328125, 0.24169921875, 0.2734832763671875, 0.305267333984375, 0.3370513916015625, 0.36883544921875, 0.4006195068359375, 0.432403564453125, 0.4641876220703125, 0.4959716796875, 0.5277557373046875, 0.559539794921875, 0.5913238525390625, 0.62310791015625, 0.6548919677734375, 0.686676025390625, 0.7184600830078125, 0.750244140625, 0.7820281982421875, 0.813812255859375, 0.8455963134765625, 0.87738037109375, 0.9091644287109375, 0.940948486328125, 0.9727325439453125, 1.0045166015625, 1.0363006591796875, 1.068084716796875, 1.0998687744140625, 1.13165283203125, 1.1634368896484375, 1.195220947265625, 1.2270050048828125, 1.2587890625]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 5.0, 3.0, 8.0, 7.0, 8.0, 9.0, 13.0, 15.0, 27.0, 24.0, 23.0, 30.0, 35.0, 66.0, 123.0, 260.0, 867.0, 5075.0, 104089.0, 4048587.0, 31224.0, 2593.0, 566.0, 202.0, 83.0, 57.0, 46.0, 33.0, 31.0, 25.0, 18.0, 34.0, 16.0, 15.0, 8.0, 11.0, 8.0, 8.0, 6.0, 4.0, 3.0, 4.0, 6.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-10.359375, -10.0391845703125, -9.718994140625, -9.3988037109375, -9.07861328125, -8.7584228515625, -8.438232421875, -8.1180419921875, -7.7978515625, -7.4776611328125, -7.157470703125, -6.8372802734375, -6.51708984375, -6.1968994140625, -5.876708984375, -5.5565185546875, -5.236328125, -4.9161376953125, -4.595947265625, -4.2757568359375, -3.95556640625, -3.6353759765625, -3.315185546875, -2.9949951171875, -2.6748046875, -2.3546142578125, -2.034423828125, -1.7142333984375, -1.39404296875, -1.0738525390625, -0.753662109375, -0.4334716796875, -0.11328125, 0.2069091796875, 0.527099609375, 0.8472900390625, 1.16748046875, 1.4876708984375, 1.807861328125, 2.1280517578125, 2.4482421875, 2.7684326171875, 3.088623046875, 3.4088134765625, 3.72900390625, 4.0491943359375, 4.369384765625, 4.6895751953125, 5.009765625, 5.3299560546875, 5.650146484375, 5.9703369140625, 6.29052734375, 6.6107177734375, 6.930908203125, 7.2510986328125, 7.5712890625, 7.8914794921875, 8.211669921875, 8.5318603515625, 8.85205078125, 9.1722412109375, 9.492431640625, 9.8126220703125, 10.1328125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 2.0, 4.0, 10.0, 25.0, 36.0, 63.0, 176.0, 546.0, 2303.0, 585.0, 174.0, 75.0, 30.0, 19.0, 11.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.14453125, -1.082611083984375, -1.02069091796875, -0.958770751953125, -0.8968505859375, -0.834930419921875, -0.77301025390625, -0.711090087890625, -0.649169921875, -0.587249755859375, -0.52532958984375, -0.463409423828125, -0.4014892578125, -0.339569091796875, -0.27764892578125, -0.215728759765625, -0.15380859375, -0.091888427734375, -0.02996826171875, 0.031951904296875, 0.0938720703125, 0.155792236328125, 0.21771240234375, 0.279632568359375, 0.341552734375, 0.403472900390625, 0.46539306640625, 0.527313232421875, 0.5892333984375, 0.651153564453125, 0.71307373046875, 0.774993896484375, 0.8369140625, 0.898834228515625, 0.96075439453125, 1.022674560546875, 1.0845947265625, 1.146514892578125, 1.20843505859375, 1.270355224609375, 1.332275390625, 1.394195556640625, 1.45611572265625, 1.518035888671875, 1.5799560546875, 1.641876220703125, 1.70379638671875, 1.765716552734375, 1.82763671875, 1.889556884765625, 1.95147705078125, 2.013397216796875, 2.0753173828125, 2.137237548828125, 2.19915771484375, 2.261077880859375, 2.322998046875, 2.384918212890625, 2.44683837890625, 2.508758544921875, 2.5706787109375, 2.632598876953125, 2.69451904296875, 2.756439208984375, 2.818359375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 21.0, 109.0, 502.0, 304.0, 49.0, 12.0, 4.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.939613342285156, -29.271146774291992, -28.602680206298828, -27.934213638305664, -27.2657470703125, -26.597280502319336, -25.928813934326172, -25.260347366333008, -24.591880798339844, -23.92341423034668, -23.254947662353516, -22.58648109436035, -21.918014526367188, -21.249547958374023, -20.58108139038086, -19.912614822387695, -19.24414825439453, -18.575681686401367, -17.907215118408203, -17.23874855041504, -16.570281982421875, -15.901815414428711, -15.233348846435547, -14.564882278442383, -13.896415710449219, -13.227949142456055, -12.55948257446289, -11.891016006469727, -11.222549438476562, -10.554082870483398, -9.885616302490234, -9.21714973449707, -8.548681259155273, -7.880214691162109, -7.211748123168945, -6.543281555175781, -5.874814987182617, -5.206348419189453, -4.537881851196289, -3.869415283203125, -3.200948715209961, -2.532482147216797, -1.8640155792236328, -1.1955490112304688, -0.5270824432373047, 0.14138412475585938, 0.8098506927490234, 1.4783172607421875, 2.1467838287353516, 2.8152503967285156, 3.4837169647216797, 4.152183532714844, 4.820650100708008, 5.489116668701172, 6.157583236694336, 6.8260498046875, 7.494516372680664, 8.162982940673828, 8.831449508666992, 9.499916076660156, 10.16838264465332, 10.836849212646484, 11.505315780639648, 12.173782348632812, 12.842248916625977]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 10.0, 12.0, 22.0, 17.0, 19.0, 33.0, 37.0, 44.0, 55.0, 67.0, 78.0, 89.0, 81.0, 74.0, 61.0, 65.0, 57.0, 40.0, 29.0, 31.0, 19.0, 19.0, 12.0, 9.0, 8.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6302409172058105, -6.434739589691162, -6.239238262176514, -6.043736457824707, -5.848235130310059, -5.65273380279541, -5.457232475280762, -5.261731147766113, -5.066229820251465, -4.870728492736816, -4.675227165222168, -4.4797258377075195, -4.284224033355713, -4.0887227058410645, -3.893221378326416, -3.6977200508117676, -3.50221848487854, -3.3067171573638916, -3.111215591430664, -2.9157142639160156, -2.720212936401367, -2.5247116088867188, -2.329210042953491, -2.1337087154388428, -1.9382072687149048, -1.7427058219909668, -1.5472044944763184, -1.3517030477523804, -1.1562016010284424, -0.960700273513794, -0.765198826789856, -0.5696974992752075, -0.37419605255126953, -0.17869465053081512, 0.016806751489639282, 0.21230816841125488, 0.4078095555305481, 0.6033109426498413, 0.7988123893737793, 0.9943137168884277, 1.1898151636123657, 1.3853166103363037, 1.5808179378509521, 1.7763193845748901, 1.9718208312988281, 2.1673221588134766, 2.362823486328125, 2.5583248138427734, 2.753826379776001, 2.9493277072906494, 3.144829273223877, 3.3403306007385254, 3.535831928253174, 3.7313332557678223, 3.92683482170105, 4.122336387634277, 4.317837715148926, 4.513339042663574, 4.708840370178223, 4.904341697692871, 5.099843502044678, 5.295344829559326, 5.490846157073975, 5.686347484588623, 5.8818488121032715]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 2.0, 2.0, 7.0, 8.0, 10.0, 9.0, 25.0, 44.0, 67.0, 123.0, 170.0, 349.0, 747.0, 2179.0, 7782.0, 67997.0, 806653.0, 145734.0, 11821.0, 2861.0, 1021.0, 434.0, 208.0, 106.0, 70.0, 41.0, 38.0, 17.0, 9.0, 8.0, 5.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.16015625, -5.958984375, -5.7578125, -5.556640625, -5.35546875, -5.154296875, -4.953125, -4.751953125, -4.55078125, -4.349609375, -4.1484375, -3.947265625, -3.74609375, -3.544921875, -3.34375, -3.142578125, -2.94140625, -2.740234375, -2.5390625, -2.337890625, -2.13671875, -1.935546875, -1.734375, -1.533203125, -1.33203125, -1.130859375, -0.9296875, -0.728515625, -0.52734375, -0.326171875, -0.125, 0.076171875, 0.27734375, 0.478515625, 0.6796875, 0.880859375, 1.08203125, 1.283203125, 1.484375, 1.685546875, 1.88671875, 2.087890625, 2.2890625, 2.490234375, 2.69140625, 2.892578125, 3.09375, 3.294921875, 3.49609375, 3.697265625, 3.8984375, 4.099609375, 4.30078125, 4.501953125, 4.703125, 4.904296875, 5.10546875, 5.306640625, 5.5078125, 5.708984375, 5.91015625, 6.111328125, 6.3125, 6.513671875, 6.71484375]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 8.0, 7.0, 20.0, 43.0, 48.0, 90.0, 134.0, 148.0, 120.0, 118.0, 77.0, 76.0, 38.0, 22.0, 12.0, 6.0, 6.0, 3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67529296875, -0.6462173461914062, -0.6171417236328125, -0.5880661010742188, -0.558990478515625, -0.5299148559570312, -0.5008392333984375, -0.47176361083984375, -0.44268798828125, -0.41361236572265625, -0.3845367431640625, -0.35546112060546875, -0.326385498046875, -0.29730987548828125, -0.2682342529296875, -0.23915863037109375, -0.2100830078125, -0.18100738525390625, -0.1519317626953125, -0.12285614013671875, -0.093780517578125, -0.06470489501953125, -0.0356292724609375, -0.00655364990234375, 0.02252197265625, 0.05159759521484375, 0.0806732177734375, 0.10974884033203125, 0.138824462890625, 0.16790008544921875, 0.1969757080078125, 0.22605133056640625, 0.255126953125, 0.28420257568359375, 0.3132781982421875, 0.34235382080078125, 0.371429443359375, 0.40050506591796875, 0.4295806884765625, 0.45865631103515625, 0.48773193359375, 0.5168075561523438, 0.5458831787109375, 0.5749588012695312, 0.604034423828125, 0.6331100463867188, 0.6621856689453125, 0.6912612915039062, 0.7203369140625, 0.7494125366210938, 0.7784881591796875, 0.8075637817382812, 0.836639404296875, 0.8657150268554688, 0.8947906494140625, 0.9238662719726562, 0.95294189453125, 0.9820175170898438, 1.0110931396484375, 1.0401687622070312, 1.069244384765625, 1.0983200073242188, 1.1273956298828125, 1.1564712524414062, 1.185546875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 8.0, 4.0, 14.0, 25.0, 27.0, 39.0, 58.0, 72.0, 108.0, 147.0, 249.0, 411.0, 651.0, 1353.0, 3340.0, 9247.0, 31703.0, 136593.0, 515061.0, 268158.0, 56528.0, 15260.0, 4999.0, 2023.0, 959.0, 545.0, 312.0, 208.0, 130.0, 99.0, 67.0, 48.0, 23.0, 16.0, 23.0, 19.0, 4.0, 2.0, 9.0, 5.0, 2.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.845703125, -2.74658203125, -2.6474609375, -2.54833984375, -2.44921875, -2.35009765625, -2.2509765625, -2.15185546875, -2.052734375, -1.95361328125, -1.8544921875, -1.75537109375, -1.65625, -1.55712890625, -1.4580078125, -1.35888671875, -1.259765625, -1.16064453125, -1.0615234375, -0.96240234375, -0.86328125, -0.76416015625, -0.6650390625, -0.56591796875, -0.466796875, -0.36767578125, -0.2685546875, -0.16943359375, -0.0703125, 0.02880859375, 0.1279296875, 0.22705078125, 0.326171875, 0.42529296875, 0.5244140625, 0.62353515625, 0.72265625, 0.82177734375, 0.9208984375, 1.02001953125, 1.119140625, 1.21826171875, 1.3173828125, 1.41650390625, 1.515625, 1.61474609375, 1.7138671875, 1.81298828125, 1.912109375, 2.01123046875, 2.1103515625, 2.20947265625, 2.30859375, 2.40771484375, 2.5068359375, 2.60595703125, 2.705078125, 2.80419921875, 2.9033203125, 3.00244140625, 3.1015625, 3.20068359375, 3.2998046875, 3.39892578125, 3.498046875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 3.0, 3.0, 9.0, 8.0, 10.0, 12.0, 15.0, 18.0, 20.0, 37.0, 20.0, 52.0, 35.0, 37.0, 61.0, 48.0, 53.0, 55.0, 49.0, 47.0, 42.0, 47.0, 42.0, 39.0, 42.0, 39.0, 29.0, 26.0, 23.0, 19.0, 18.0, 12.0, 3.0, 13.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.712890625, -2.61712646484375, -2.5213623046875, -2.42559814453125, -2.329833984375, -2.23406982421875, -2.1383056640625, -2.04254150390625, -1.94677734375, -1.85101318359375, -1.7552490234375, -1.65948486328125, -1.563720703125, -1.46795654296875, -1.3721923828125, -1.27642822265625, -1.1806640625, -1.08489990234375, -0.9891357421875, -0.89337158203125, -0.797607421875, -0.70184326171875, -0.6060791015625, -0.51031494140625, -0.41455078125, -0.31878662109375, -0.2230224609375, -0.12725830078125, -0.031494140625, 0.06427001953125, 0.1600341796875, 0.25579833984375, 0.3515625, 0.44732666015625, 0.5430908203125, 0.63885498046875, 0.734619140625, 0.83038330078125, 0.9261474609375, 1.02191162109375, 1.11767578125, 1.21343994140625, 1.3092041015625, 1.40496826171875, 1.500732421875, 1.59649658203125, 1.6922607421875, 1.78802490234375, 1.8837890625, 1.97955322265625, 2.0753173828125, 2.17108154296875, 2.266845703125, 2.36260986328125, 2.4583740234375, 2.55413818359375, 2.64990234375, 2.74566650390625, 2.8414306640625, 2.93719482421875, 3.032958984375, 3.12872314453125, 3.2244873046875, 3.32025146484375, 3.416015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 8.0, 10.0, 18.0, 23.0, 47.0, 92.0, 195.0, 478.0, 1496.0, 8091.0, 106593.0, 821121.0, 100386.0, 7746.0, 1420.0, 453.0, 159.0, 92.0, 48.0, 38.0, 16.0, 8.0, 4.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.654296875, -2.572601318359375, -2.49090576171875, -2.409210205078125, -2.3275146484375, -2.245819091796875, -2.16412353515625, -2.082427978515625, -2.000732421875, -1.919036865234375, -1.83734130859375, -1.755645751953125, -1.6739501953125, -1.592254638671875, -1.51055908203125, -1.428863525390625, -1.34716796875, -1.265472412109375, -1.18377685546875, -1.102081298828125, -1.0203857421875, -0.938690185546875, -0.85699462890625, -0.775299072265625, -0.693603515625, -0.611907958984375, -0.53021240234375, -0.448516845703125, -0.3668212890625, -0.285125732421875, -0.20343017578125, -0.121734619140625, -0.0400390625, 0.041656494140625, 0.12335205078125, 0.205047607421875, 0.2867431640625, 0.368438720703125, 0.45013427734375, 0.531829833984375, 0.613525390625, 0.695220947265625, 0.77691650390625, 0.858612060546875, 0.9403076171875, 1.022003173828125, 1.10369873046875, 1.185394287109375, 1.26708984375, 1.348785400390625, 1.43048095703125, 1.512176513671875, 1.5938720703125, 1.675567626953125, 1.75726318359375, 1.838958740234375, 1.920654296875, 2.002349853515625, 2.08404541015625, 2.165740966796875, 2.2474365234375, 2.329132080078125, 2.41082763671875, 2.492523193359375, 2.57421875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 4.0, 3.0, 3.0, 3.0, 20.0, 11.0, 11.0, 12.0, 16.0, 25.0, 16.0, 30.0, 35.0, 44.0, 63.0, 111.0, 132.0, 115.0, 71.0, 54.0, 44.0, 36.0, 17.0, 17.0, 17.0, 14.0, 11.0, 16.0, 11.0, 6.0, 2.0, 5.0, 4.0, 5.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0001995563507080078, -0.00019362196326255798, -0.00018768757581710815, -0.00018175318837165833, -0.0001758188009262085, -0.00016988441348075867, -0.00016395002603530884, -0.000158015638589859, -0.00015208125114440918, -0.00014614686369895935, -0.00014021247625350952, -0.0001342780888080597, -0.00012834370136260986, -0.00012240931391716003, -0.0001164749264717102, -0.00011054053902626038, -0.00010460615158081055, -9.867176413536072e-05, -9.273737668991089e-05, -8.680298924446106e-05, -8.086860179901123e-05, -7.49342143535614e-05, -6.899982690811157e-05, -6.306543946266174e-05, -5.7131052017211914e-05, -5.1196664571762085e-05, -4.5262277126312256e-05, -3.932788968086243e-05, -3.33935022354126e-05, -2.745911478996277e-05, -2.152472734451294e-05, -1.559033989906311e-05, -9.655952453613281e-06, -3.721565008163452e-06, 2.212822437286377e-06, 8.147209882736206e-06, 1.4081597328186035e-05, 2.0015984773635864e-05, 2.5950372219085693e-05, 3.188475966453552e-05, 3.781914710998535e-05, 4.375353455543518e-05, 4.968792200088501e-05, 5.562230944633484e-05, 6.155669689178467e-05, 6.74910843372345e-05, 7.342547178268433e-05, 7.935985922813416e-05, 8.529424667358398e-05, 9.122863411903381e-05, 9.716302156448364e-05, 0.00010309740900993347, 0.0001090317964553833, 0.00011496618390083313, 0.00012090057134628296, 0.0001268349587917328, 0.00013276934623718262, 0.00013870373368263245, 0.00014463812112808228, 0.0001505725085735321, 0.00015650689601898193, 0.00016244128346443176, 0.0001683756709098816, 0.00017431005835533142, 0.00018024444580078125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 10.0, 15.0, 19.0, 28.0, 51.0, 71.0, 131.0, 242.0, 440.0, 971.0, 2247.0, 6741.0, 32078.0, 242230.0, 640314.0, 100299.0, 15580.0, 4217.0, 1492.0, 658.0, 319.0, 170.0, 82.0, 50.0, 31.0, 17.0, 10.0, 9.0, 5.0, 9.0, 3.0, 8.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8515625, -1.792388916015625, -1.73321533203125, -1.674041748046875, -1.6148681640625, -1.555694580078125, -1.49652099609375, -1.437347412109375, -1.378173828125, -1.319000244140625, -1.25982666015625, -1.200653076171875, -1.1414794921875, -1.082305908203125, -1.02313232421875, -0.963958740234375, -0.90478515625, -0.845611572265625, -0.78643798828125, -0.727264404296875, -0.6680908203125, -0.608917236328125, -0.54974365234375, -0.490570068359375, -0.431396484375, -0.372222900390625, -0.31304931640625, -0.253875732421875, -0.1947021484375, -0.135528564453125, -0.07635498046875, -0.017181396484375, 0.0419921875, 0.101165771484375, 0.16033935546875, 0.219512939453125, 0.2786865234375, 0.337860107421875, 0.39703369140625, 0.456207275390625, 0.515380859375, 0.574554443359375, 0.63372802734375, 0.692901611328125, 0.7520751953125, 0.811248779296875, 0.87042236328125, 0.929595947265625, 0.98876953125, 1.047943115234375, 1.10711669921875, 1.166290283203125, 1.2254638671875, 1.284637451171875, 1.34381103515625, 1.402984619140625, 1.462158203125, 1.521331787109375, 1.58050537109375, 1.639678955078125, 1.6988525390625, 1.758026123046875, 1.81719970703125, 1.876373291015625, 1.935546875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 1.0, 4.0, 5.0, 3.0, 5.0, 11.0, 5.0, 12.0, 19.0, 25.0, 37.0, 24.0, 40.0, 48.0, 68.0, 76.0, 72.0, 88.0, 75.0, 82.0, 76.0, 49.0, 34.0, 33.0, 32.0, 20.0, 13.0, 14.0, 11.0, 7.0, 3.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97607421875, -0.9451217651367188, -0.9141693115234375, -0.8832168579101562, -0.852264404296875, -0.8213119506835938, -0.7903594970703125, -0.7594070434570312, -0.72845458984375, -0.6975021362304688, -0.6665496826171875, -0.6355972290039062, -0.604644775390625, -0.5736923217773438, -0.5427398681640625, -0.5117874145507812, -0.4808349609375, -0.44988250732421875, -0.4189300537109375, -0.38797760009765625, -0.357025146484375, -0.32607269287109375, -0.2951202392578125, -0.26416778564453125, -0.23321533203125, -0.20226287841796875, -0.1713104248046875, -0.14035797119140625, -0.109405517578125, -0.07845306396484375, -0.0475006103515625, -0.01654815673828125, 0.014404296875, 0.04535675048828125, 0.0763092041015625, 0.10726165771484375, 0.138214111328125, 0.16916656494140625, 0.2001190185546875, 0.23107147216796875, 0.26202392578125, 0.29297637939453125, 0.3239288330078125, 0.35488128662109375, 0.385833740234375, 0.41678619384765625, 0.4477386474609375, 0.47869110107421875, 0.5096435546875, 0.5405960083007812, 0.5715484619140625, 0.6025009155273438, 0.633453369140625, 0.6644058227539062, 0.6953582763671875, 0.7263107299804688, 0.75726318359375, 0.7882156372070312, 0.8191680908203125, 0.8501205444335938, 0.881072998046875, 0.9120254516601562, 0.9429779052734375, 0.9739303588867188, 1.0048828125]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 5.0, 16.0, 22.0, 71.0, 224.0, 335.0, 200.0, 75.0, 36.0, 12.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.366262435913086, -29.260591506958008, -28.15492057800293, -27.04924964904785, -25.943578720092773, -24.837907791137695, -23.73223876953125, -22.626567840576172, -21.520896911621094, -20.415225982666016, -19.309555053710938, -18.20388412475586, -17.09821319580078, -15.992542266845703, -14.886872291564941, -13.781201362609863, -12.675529479980469, -11.56985855102539, -10.464187622070312, -9.358516693115234, -8.252845764160156, -7.147175312042236, -6.041504859924316, -4.935833930969238, -3.83016300201416, -2.724492073059082, -1.618821382522583, -0.513150691986084, 0.5925202369689941, 1.6981911659240723, 2.803861618041992, 3.9095325469970703, 5.015201568603516, 6.120872497558594, 7.226543426513672, 8.33221435546875, 9.437885284423828, 10.543556213378906, 11.649226188659668, 12.754897117614746, 13.860568046569824, 14.966238975524902, 16.071908950805664, 17.177579879760742, 18.28325080871582, 19.3889217376709, 20.494592666625977, 21.600263595581055, 22.705934524536133, 23.81160545349121, 24.91727638244629, 26.022947311401367, 27.128618240356445, 28.234289169311523, 29.33995819091797, 30.445629119873047, 31.551300048828125, 32.6569709777832, 33.76264190673828, 34.86831283569336, 35.97398376464844, 37.079654693603516, 38.185325622558594, 39.29099655151367, 40.39666748046875]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 2.0, 6.0, 4.0, 2.0, 4.0, 2.0, 10.0, 6.0, 16.0, 20.0, 19.0, 18.0, 22.0, 28.0, 38.0, 29.0, 36.0, 34.0, 37.0, 55.0, 43.0, 43.0, 36.0, 43.0, 45.0, 47.0, 43.0, 54.0, 40.0, 48.0, 28.0, 29.0, 18.0, 20.0, 28.0, 17.0, 10.0, 12.0, 6.0, 2.0, 2.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-21.32120704650879, -20.749475479125977, -20.17774200439453, -19.60601043701172, -19.034278869628906, -18.462547302246094, -17.89081382751465, -17.319082260131836, -16.74734878540039, -16.175617218017578, -15.60388469696045, -15.03215217590332, -14.460420608520508, -13.888688087463379, -13.31695556640625, -12.745223999023438, -12.173492431640625, -11.601759910583496, -11.030028343200684, -10.458295822143555, -9.886564254760742, -9.314831733703613, -8.743099212646484, -8.171367645263672, -7.599635124206543, -7.027903079986572, -6.456171035766602, -5.884438514709473, -5.312706470489502, -4.740974426269531, -4.169241905212402, -3.5975098609924316, -3.0257797241210938, -2.454047679901123, -1.8823153972625732, -1.310583233833313, -0.7388510704040527, -0.16711902618408203, 0.4046132564544678, 0.9763455390930176, 1.5480775833129883, 2.119809627532959, 2.691541910171509, 3.2632741928100586, 3.8350062370300293, 4.40673828125, 4.978470802307129, 5.5502028465271, 6.12193489074707, 6.693666934967041, 7.265398979187012, 7.837131500244141, 8.408863067626953, 8.980595588684082, 9.552328109741211, 10.124059677124023, 10.695792198181152, 11.267524719238281, 11.839256286621094, 12.410988807678223, 12.982721328735352, 13.554452896118164, 14.126185417175293, 14.697917938232422, 15.269649505615234]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 5.0, 8.0, 19.0, 18.0, 29.0, 51.0, 73.0, 125.0, 254.0, 545.0, 1328.0, 4297.0, 20984.0, 374518.0, 3732426.0, 46923.0, 8009.0, 2336.0, 927.0, 528.0, 272.0, 168.0, 121.0, 73.0, 57.0, 39.0, 29.0, 28.0, 10.0, 16.0, 11.0, 12.0, 5.0, 7.0, 6.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.26171875, -4.06060791015625, -3.8594970703125, -3.65838623046875, -3.457275390625, -3.25616455078125, -3.0550537109375, -2.85394287109375, -2.65283203125, -2.45172119140625, -2.2506103515625, -2.04949951171875, -1.848388671875, -1.64727783203125, -1.4461669921875, -1.24505615234375, -1.0439453125, -0.84283447265625, -0.6417236328125, -0.44061279296875, -0.239501953125, -0.03839111328125, 0.1627197265625, 0.36383056640625, 0.56494140625, 0.76605224609375, 0.9671630859375, 1.16827392578125, 1.369384765625, 1.57049560546875, 1.7716064453125, 1.97271728515625, 2.173828125, 2.37493896484375, 2.5760498046875, 2.77716064453125, 2.978271484375, 3.17938232421875, 3.3804931640625, 3.58160400390625, 3.78271484375, 3.98382568359375, 4.1849365234375, 4.38604736328125, 4.587158203125, 4.78826904296875, 4.9893798828125, 5.19049072265625, 5.3916015625, 5.59271240234375, 5.7938232421875, 5.99493408203125, 6.196044921875, 6.39715576171875, 6.5982666015625, 6.79937744140625, 7.00048828125, 7.20159912109375, 7.4027099609375, 7.60382080078125, 7.804931640625, 8.00604248046875, 8.2071533203125, 8.40826416015625, 8.609375]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 3.0, 10.0, 11.0, 12.0, 25.0, 40.0, 34.0, 61.0, 69.0, 99.0, 86.0, 96.0, 114.0, 72.0, 66.0, 63.0, 35.0, 38.0, 14.0, 20.0, 12.0, 5.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54833984375, -0.5202865600585938, -0.4922332763671875, -0.46417999267578125, -0.436126708984375, -0.40807342529296875, -0.3800201416015625, -0.35196685791015625, -0.32391357421875, -0.29586029052734375, -0.2678070068359375, -0.23975372314453125, -0.211700439453125, -0.18364715576171875, -0.1555938720703125, -0.12754058837890625, -0.0994873046875, -0.07143402099609375, -0.0433807373046875, -0.01532745361328125, 0.012725830078125, 0.04077911376953125, 0.0688323974609375, 0.09688568115234375, 0.12493896484375, 0.15299224853515625, 0.1810455322265625, 0.20909881591796875, 0.237152099609375, 0.26520538330078125, 0.2932586669921875, 0.32131195068359375, 0.349365234375, 0.37741851806640625, 0.4054718017578125, 0.43352508544921875, 0.461578369140625, 0.48963165283203125, 0.5176849365234375, 0.5457382202148438, 0.57379150390625, 0.6018447875976562, 0.6298980712890625, 0.6579513549804688, 0.686004638671875, 0.7140579223632812, 0.7421112060546875, 0.7701644897460938, 0.7982177734375, 0.8262710571289062, 0.8543243408203125, 0.8823776245117188, 0.910430908203125, 0.9384841918945312, 0.9665374755859375, 0.9945907592773438, 1.02264404296875, 1.0506973266601562, 1.0787506103515625, 1.1068038940429688, 1.134857177734375, 1.1629104614257812, 1.1909637451171875, 1.2190170288085938, 1.2470703125]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 17.0, 16.0, 23.0, 23.0, 20.0, 24.0, 35.0, 52.0, 64.0, 118.0, 213.0, 578.0, 5078.0, 1700403.0, 2480144.0, 5902.0, 706.0, 246.0, 161.0, 99.0, 74.0, 54.0, 36.0, 40.0, 24.0, 21.0, 26.0, 8.0, 20.0, 18.0, 5.0, 5.0, 8.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-12.28125, -11.940185546875, -11.59912109375, -11.258056640625, -10.9169921875, -10.575927734375, -10.23486328125, -9.893798828125, -9.552734375, -9.211669921875, -8.87060546875, -8.529541015625, -8.1884765625, -7.847412109375, -7.50634765625, -7.165283203125, -6.82421875, -6.483154296875, -6.14208984375, -5.801025390625, -5.4599609375, -5.118896484375, -4.77783203125, -4.436767578125, -4.095703125, -3.754638671875, -3.41357421875, -3.072509765625, -2.7314453125, -2.390380859375, -2.04931640625, -1.708251953125, -1.3671875, -1.026123046875, -0.68505859375, -0.343994140625, -0.0029296875, 0.338134765625, 0.67919921875, 1.020263671875, 1.361328125, 1.702392578125, 2.04345703125, 2.384521484375, 2.7255859375, 3.066650390625, 3.40771484375, 3.748779296875, 4.08984375, 4.430908203125, 4.77197265625, 5.113037109375, 5.4541015625, 5.795166015625, 6.13623046875, 6.477294921875, 6.818359375, 7.159423828125, 7.50048828125, 7.841552734375, 8.1826171875, 8.523681640625, 8.86474609375, 9.205810546875, 9.546875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [5.0, 2.0, 8.0, 9.0, 14.0, 28.0, 64.0, 140.0, 452.0, 2392.0, 643.0, 164.0, 81.0, 35.0, 24.0, 12.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5732421875, -0.5135040283203125, -0.453765869140625, -0.3940277099609375, -0.33428955078125, -0.2745513916015625, -0.214813232421875, -0.1550750732421875, -0.0953369140625, -0.0355987548828125, 0.024139404296875, 0.0838775634765625, 0.14361572265625, 0.2033538818359375, 0.263092041015625, 0.3228302001953125, 0.382568359375, 0.4423065185546875, 0.502044677734375, 0.5617828369140625, 0.62152099609375, 0.6812591552734375, 0.740997314453125, 0.8007354736328125, 0.8604736328125, 0.9202117919921875, 0.979949951171875, 1.0396881103515625, 1.09942626953125, 1.1591644287109375, 1.218902587890625, 1.2786407470703125, 1.33837890625, 1.3981170654296875, 1.457855224609375, 1.5175933837890625, 1.57733154296875, 1.6370697021484375, 1.696807861328125, 1.7565460205078125, 1.8162841796875, 1.8760223388671875, 1.935760498046875, 1.9954986572265625, 2.05523681640625, 2.1149749755859375, 2.174713134765625, 2.2344512939453125, 2.294189453125, 2.3539276123046875, 2.413665771484375, 2.4734039306640625, 2.53314208984375, 2.5928802490234375, 2.652618408203125, 2.7123565673828125, 2.7720947265625, 2.8318328857421875, 2.891571044921875, 2.9513092041015625, 3.01104736328125, 3.0707855224609375, 3.130523681640625, 3.1902618408203125, 3.25]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 8.0, 20.0, 47.0, 148.0, 328.0, 264.0, 107.0, 45.0, 16.0, 8.0, 7.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.525618553161621, -8.193577766418457, -7.861537456512451, -7.529496669769287, -7.197455883026123, -6.865415573120117, -6.533374786376953, -6.201333999633789, -5.869293212890625, -5.537252426147461, -5.205212116241455, -4.873171329498291, -4.541130542755127, -4.209090232849121, -3.877049446105957, -3.545008659362793, -3.212968349456787, -2.880927801132202, -2.548887014389038, -2.216846466064453, -1.8848057985305786, -1.552765130996704, -1.2207245826721191, -0.8886837959289551, -0.5566432476043701, -0.224602609872818, 0.10743802785873413, 0.43947863578796387, 0.7715193033218384, 1.103559970855713, 1.4356005191802979, 1.767641305923462, 2.099681854248047, 2.431722402572632, 2.763763189315796, 3.095803737640381, 3.427844524383545, 3.75988507270813, 4.091925621032715, 4.423966407775879, 4.756007194519043, 5.088047981262207, 5.420088291168213, 5.752129077911377, 6.084169864654541, 6.416210174560547, 6.748250961303711, 7.080291748046875, 7.412332057952881, 7.744372844696045, 8.07641315460205, 8.408453941345215, 8.740494728088379, 9.072535514831543, 9.40457534790039, 9.736616134643555, 10.068656921386719, 10.400697708129883, 10.732738494873047, 11.064779281616211, 11.396819114685059, 11.728859901428223, 12.060900688171387, 12.39294147491455, 12.724982261657715]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 3.0, 8.0, 6.0, 15.0, 14.0, 25.0, 34.0, 30.0, 30.0, 26.0, 49.0, 59.0, 54.0, 61.0, 50.0, 50.0, 66.0, 59.0, 67.0, 46.0, 40.0, 32.0, 33.0, 27.0, 21.0, 26.0, 26.0, 15.0, 7.0, 8.0, 4.0, 4.0, 4.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.25840950012207, -5.129344463348389, -5.000279426574707, -4.871213912963867, -4.7421488761901855, -4.613083839416504, -4.484018802642822, -4.354953765869141, -4.225888252258301, -4.096823215484619, -3.9677579402923584, -3.8386929035186768, -3.709627628326416, -3.5805625915527344, -3.4514975547790527, -3.322432518005371, -3.1933674812316895, -3.064302444458008, -2.935237169265747, -2.8061721324920654, -2.6771068572998047, -2.548041820526123, -2.4189767837524414, -2.2899117469787598, -2.160846471786499, -2.0317814350128174, -1.9027161598205566, -1.773651123046875, -1.6445859670639038, -1.5155208110809326, -1.386455774307251, -1.2573906183242798, -1.1283249855041504, -0.9992598295211792, -0.8701947331428528, -0.7411296367645264, -0.6120644807815552, -0.482999324798584, -0.35393422842025757, -0.22486913204193115, -0.09580397605895996, 0.03326115012168884, 0.16232627630233765, 0.29139140248298645, 0.42045652866363525, 0.5495216846466064, 0.6785867810249329, 0.8076518774032593, 0.9367170333862305, 1.0657821893692017, 1.1948473453521729, 1.3239123821258545, 1.4529775381088257, 1.5820426940917969, 1.7111077308654785, 1.8401728868484497, 1.969238042831421, 2.0983030796051025, 2.2273683547973633, 2.356433391571045, 2.4854984283447266, 2.6145637035369873, 2.743628740310669, 2.8726940155029297, 3.0017590522766113]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 6.0, 8.0, 9.0, 17.0, 12.0, 14.0, 17.0, 37.0, 32.0, 44.0, 69.0, 104.0, 182.0, 266.0, 492.0, 905.0, 1884.0, 4420.0, 12174.0, 40160.0, 165897.0, 505071.0, 236060.0, 54818.0, 15531.0, 5562.0, 2324.0, 1087.0, 538.0, 273.0, 176.0, 107.0, 66.0, 56.0, 35.0, 24.0, 21.0, 18.0, 11.0, 6.0, 5.0, 12.0, 2.0, 0.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.408203125, -2.33203125, -2.255859375, -2.1796875, -2.103515625, -2.02734375, -1.951171875, -1.875, -1.798828125, -1.72265625, -1.646484375, -1.5703125, -1.494140625, -1.41796875, -1.341796875, -1.265625, -1.189453125, -1.11328125, -1.037109375, -0.9609375, -0.884765625, -0.80859375, -0.732421875, -0.65625, -0.580078125, -0.50390625, -0.427734375, -0.3515625, -0.275390625, -0.19921875, -0.123046875, -0.046875, 0.029296875, 0.10546875, 0.181640625, 0.2578125, 0.333984375, 0.41015625, 0.486328125, 0.5625, 0.638671875, 0.71484375, 0.791015625, 0.8671875, 0.943359375, 1.01953125, 1.095703125, 1.171875, 1.248046875, 1.32421875, 1.400390625, 1.4765625, 1.552734375, 1.62890625, 1.705078125, 1.78125, 1.857421875, 1.93359375, 2.009765625, 2.0859375, 2.162109375, 2.23828125, 2.314453125, 2.390625, 2.466796875]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 4.0, 6.0, 4.0, 8.0, 12.0, 20.0, 20.0, 37.0, 49.0, 73.0, 85.0, 86.0, 98.0, 94.0, 92.0, 71.0, 66.0, 55.0, 40.0, 30.0, 14.0, 13.0, 8.0, 7.0, 8.0, 2.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55029296875, -0.5230331420898438, -0.4957733154296875, -0.46851348876953125, -0.441253662109375, -0.41399383544921875, -0.3867340087890625, -0.35947418212890625, -0.33221435546875, -0.30495452880859375, -0.2776947021484375, -0.25043487548828125, -0.223175048828125, -0.19591522216796875, -0.1686553955078125, -0.14139556884765625, -0.1141357421875, -0.08687591552734375, -0.0596160888671875, -0.03235626220703125, -0.005096435546875, 0.02216339111328125, 0.0494232177734375, 0.07668304443359375, 0.10394287109375, 0.13120269775390625, 0.1584625244140625, 0.18572235107421875, 0.212982177734375, 0.24024200439453125, 0.2675018310546875, 0.29476165771484375, 0.322021484375, 0.34928131103515625, 0.3765411376953125, 0.40380096435546875, 0.431060791015625, 0.45832061767578125, 0.4855804443359375, 0.5128402709960938, 0.54010009765625, 0.5673599243164062, 0.5946197509765625, 0.6218795776367188, 0.649139404296875, 0.6763992309570312, 0.7036590576171875, 0.7309188842773438, 0.7581787109375, 0.7854385375976562, 0.8126983642578125, 0.8399581909179688, 0.867218017578125, 0.8944778442382812, 0.9217376708984375, 0.9489974975585938, 0.97625732421875, 1.0035171508789062, 1.0307769775390625, 1.0580368041992188, 1.085296630859375, 1.1125564575195312, 1.1398162841796875, 1.1670761108398438, 1.1943359375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 8.0, 10.0, 13.0, 17.0, 15.0, 12.0, 28.0, 35.0, 82.0, 98.0, 138.0, 207.0, 400.0, 691.0, 1314.0, 2845.0, 7230.0, 22348.0, 86276.0, 360874.0, 417000.0, 106961.0, 26881.0, 8416.0, 3319.0, 1424.0, 757.0, 411.0, 226.0, 176.0, 82.0, 72.0, 52.0, 39.0, 27.0, 19.0, 11.0, 13.0, 9.0, 4.0, 1.0, 6.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.1796875, -2.107208251953125, -2.03472900390625, -1.962249755859375, -1.8897705078125, -1.817291259765625, -1.74481201171875, -1.672332763671875, -1.599853515625, -1.527374267578125, -1.45489501953125, -1.382415771484375, -1.3099365234375, -1.237457275390625, -1.16497802734375, -1.092498779296875, -1.02001953125, -0.947540283203125, -0.87506103515625, -0.802581787109375, -0.7301025390625, -0.657623291015625, -0.58514404296875, -0.512664794921875, -0.440185546875, -0.367706298828125, -0.29522705078125, -0.222747802734375, -0.1502685546875, -0.077789306640625, -0.00531005859375, 0.067169189453125, 0.1396484375, 0.212127685546875, 0.28460693359375, 0.357086181640625, 0.4295654296875, 0.502044677734375, 0.57452392578125, 0.647003173828125, 0.719482421875, 0.791961669921875, 0.86444091796875, 0.936920166015625, 1.0093994140625, 1.081878662109375, 1.15435791015625, 1.226837158203125, 1.29931640625, 1.371795654296875, 1.44427490234375, 1.516754150390625, 1.5892333984375, 1.661712646484375, 1.73419189453125, 1.806671142578125, 1.879150390625, 1.951629638671875, 2.02410888671875, 2.096588134765625, 2.1690673828125, 2.241546630859375, 2.31402587890625, 2.386505126953125, 2.458984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 5.0, 13.0, 6.0, 14.0, 15.0, 16.0, 22.0, 32.0, 31.0, 37.0, 33.0, 43.0, 49.0, 42.0, 59.0, 56.0, 52.0, 43.0, 51.0, 55.0, 48.0, 48.0, 37.0, 33.0, 26.0, 27.0, 13.0, 13.0, 16.0, 21.0, 8.0, 6.0, 10.0, 4.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.58984375, -2.505096435546875, -2.42034912109375, -2.335601806640625, -2.2508544921875, -2.166107177734375, -2.08135986328125, -1.996612548828125, -1.911865234375, -1.827117919921875, -1.74237060546875, -1.657623291015625, -1.5728759765625, -1.488128662109375, -1.40338134765625, -1.318634033203125, -1.23388671875, -1.149139404296875, -1.06439208984375, -0.979644775390625, -0.8948974609375, -0.810150146484375, -0.72540283203125, -0.640655517578125, -0.555908203125, -0.471160888671875, -0.38641357421875, -0.301666259765625, -0.2169189453125, -0.132171630859375, -0.04742431640625, 0.037322998046875, 0.1220703125, 0.206817626953125, 0.29156494140625, 0.376312255859375, 0.4610595703125, 0.545806884765625, 0.63055419921875, 0.715301513671875, 0.800048828125, 0.884796142578125, 0.96954345703125, 1.054290771484375, 1.1390380859375, 1.223785400390625, 1.30853271484375, 1.393280029296875, 1.47802734375, 1.562774658203125, 1.64752197265625, 1.732269287109375, 1.8170166015625, 1.901763916015625, 1.98651123046875, 2.071258544921875, 2.156005859375, 2.240753173828125, 2.32550048828125, 2.410247802734375, 2.4949951171875, 2.579742431640625, 2.66448974609375, 2.749237060546875, 2.833984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 2.0, 5.0, 18.0, 12.0, 19.0, 25.0, 68.0, 88.0, 156.0, 237.0, 513.0, 1078.0, 2828.0, 10415.0, 49906.0, 306473.0, 538551.0, 110456.0, 19504.0, 5001.0, 1656.0, 690.0, 343.0, 187.0, 107.0, 66.0, 51.0, 30.0, 22.0, 9.0, 12.0, 4.0, 5.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75830078125, -0.7314300537109375, -0.704559326171875, -0.6776885986328125, -0.65081787109375, -0.6239471435546875, -0.597076416015625, -0.5702056884765625, -0.5433349609375, -0.5164642333984375, -0.489593505859375, -0.4627227783203125, -0.43585205078125, -0.4089813232421875, -0.382110595703125, -0.3552398681640625, -0.328369140625, -0.3014984130859375, -0.274627685546875, -0.2477569580078125, -0.22088623046875, -0.1940155029296875, -0.167144775390625, -0.1402740478515625, -0.1134033203125, -0.0865325927734375, -0.059661865234375, -0.0327911376953125, -0.00592041015625, 0.0209503173828125, 0.047821044921875, 0.0746917724609375, 0.1015625, 0.1284332275390625, 0.155303955078125, 0.1821746826171875, 0.20904541015625, 0.2359161376953125, 0.262786865234375, 0.2896575927734375, 0.3165283203125, 0.3433990478515625, 0.370269775390625, 0.3971405029296875, 0.42401123046875, 0.4508819580078125, 0.477752685546875, 0.5046234130859375, 0.531494140625, 0.5583648681640625, 0.585235595703125, 0.6121063232421875, 0.63897705078125, 0.6658477783203125, 0.692718505859375, 0.7195892333984375, 0.7464599609375, 0.7733306884765625, 0.800201416015625, 0.8270721435546875, 0.85394287109375, 0.8808135986328125, 0.907684326171875, 0.9345550537109375, 0.96142578125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 5.0, 8.0, 7.0, 6.0, 9.0, 15.0, 15.0, 23.0, 30.0, 20.0, 42.0, 49.0, 55.0, 70.0, 93.0, 94.0, 88.0, 61.0, 59.0, 42.0, 51.0, 27.0, 25.0, 21.0, 17.0, 17.0, 10.0, 12.0, 11.0, 2.0, 4.0, 7.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00015211105346679688, -0.00014795362949371338, -0.00014379620552062988, -0.0001396387815475464, -0.0001354813575744629, -0.0001313239336013794, -0.0001271665096282959, -0.0001230090856552124, -0.0001188516616821289, -0.00011469423770904541, -0.00011053681373596191, -0.00010637938976287842, -0.00010222196578979492, -9.806454181671143e-05, -9.390711784362793e-05, -8.974969387054443e-05, -8.559226989746094e-05, -8.143484592437744e-05, -7.727742195129395e-05, -7.311999797821045e-05, -6.896257400512695e-05, -6.480515003204346e-05, -6.064772605895996e-05, -5.6490302085876465e-05, -5.233287811279297e-05, -4.817545413970947e-05, -4.4018030166625977e-05, -3.986060619354248e-05, -3.5703182220458984e-05, -3.154575824737549e-05, -2.7388334274291992e-05, -2.3230910301208496e-05, -1.9073486328125e-05, -1.4916062355041504e-05, -1.0758638381958008e-05, -6.601214408874512e-06, -2.4437904357910156e-06, 1.7136335372924805e-06, 5.8710575103759766e-06, 1.0028481483459473e-05, 1.4185905456542969e-05, 1.8343329429626465e-05, 2.250075340270996e-05, 2.6658177375793457e-05, 3.081560134887695e-05, 3.497302532196045e-05, 3.9130449295043945e-05, 4.328787326812744e-05, 4.744529724121094e-05, 5.1602721214294434e-05, 5.576014518737793e-05, 5.9917569160461426e-05, 6.407499313354492e-05, 6.823241710662842e-05, 7.238984107971191e-05, 7.654726505279541e-05, 8.07046890258789e-05, 8.48621129989624e-05, 8.90195369720459e-05, 9.31769609451294e-05, 9.733438491821289e-05, 0.00010149180889129639, 0.00010564923286437988, 0.00010980665683746338, 0.00011396408081054688]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 6.0, 2.0, 6.0, 7.0, 7.0, 8.0, 27.0, 35.0, 65.0, 72.0, 121.0, 193.0, 332.0, 631.0, 1325.0, 3451.0, 11149.0, 53640.0, 351342.0, 516167.0, 85875.0, 16188.0, 4451.0, 1615.0, 827.0, 384.0, 231.0, 139.0, 84.0, 63.0, 35.0, 23.0, 18.0, 10.0, 12.0, 3.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.97021484375, -0.9400177001953125, -0.909820556640625, -0.8796234130859375, -0.84942626953125, -0.8192291259765625, -0.789031982421875, -0.7588348388671875, -0.7286376953125, -0.6984405517578125, -0.668243408203125, -0.6380462646484375, -0.60784912109375, -0.5776519775390625, -0.547454833984375, -0.5172576904296875, -0.487060546875, -0.4568634033203125, -0.426666259765625, -0.3964691162109375, -0.36627197265625, -0.3360748291015625, -0.305877685546875, -0.2756805419921875, -0.2454833984375, -0.2152862548828125, -0.185089111328125, -0.1548919677734375, -0.12469482421875, -0.0944976806640625, -0.064300537109375, -0.0341033935546875, -0.00390625, 0.0262908935546875, 0.056488037109375, 0.0866851806640625, 0.11688232421875, 0.1470794677734375, 0.177276611328125, 0.2074737548828125, 0.2376708984375, 0.2678680419921875, 0.298065185546875, 0.3282623291015625, 0.35845947265625, 0.3886566162109375, 0.418853759765625, 0.4490509033203125, 0.479248046875, 0.5094451904296875, 0.539642333984375, 0.5698394775390625, 0.60003662109375, 0.6302337646484375, 0.660430908203125, 0.6906280517578125, 0.7208251953125, 0.7510223388671875, 0.781219482421875, 0.8114166259765625, 0.84161376953125, 0.8718109130859375, 0.902008056640625, 0.9322052001953125, 0.96240234375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 6.0, 2.0, 8.0, 8.0, 14.0, 11.0, 19.0, 45.0, 64.0, 86.0, 102.0, 139.0, 136.0, 100.0, 79.0, 61.0, 39.0, 23.0, 21.0, 18.0, 6.0, 4.0, 4.0, 6.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92236328125, -0.8926773071289062, -0.8629913330078125, -0.8333053588867188, -0.803619384765625, -0.7739334106445312, -0.7442474365234375, -0.7145614624023438, -0.68487548828125, -0.6551895141601562, -0.6255035400390625, -0.5958175659179688, -0.566131591796875, -0.5364456176757812, -0.5067596435546875, -0.47707366943359375, -0.4473876953125, -0.41770172119140625, -0.3880157470703125, -0.35832977294921875, -0.328643798828125, -0.29895782470703125, -0.2692718505859375, -0.23958587646484375, -0.20989990234375, -0.18021392822265625, -0.1505279541015625, -0.12084197998046875, -0.091156005859375, -0.06147003173828125, -0.0317840576171875, -0.00209808349609375, 0.027587890625, 0.05727386474609375, 0.0869598388671875, 0.11664581298828125, 0.146331787109375, 0.17601776123046875, 0.2057037353515625, 0.23538970947265625, 0.26507568359375, 0.29476165771484375, 0.3244476318359375, 0.35413360595703125, 0.383819580078125, 0.41350555419921875, 0.4431915283203125, 0.47287750244140625, 0.5025634765625, 0.5322494506835938, 0.5619354248046875, 0.5916213989257812, 0.621307373046875, 0.6509933471679688, 0.6806793212890625, 0.7103652954101562, 0.74005126953125, 0.7697372436523438, 0.7994232177734375, 0.8291091918945312, 0.858795166015625, 0.8884811401367188, 0.9181671142578125, 0.9478530883789062, 0.9775390625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 18.0, 17.0, 42.0, 97.0, 210.0, 258.0, 190.0, 84.0, 37.0, 19.0, 15.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.7354097366333, -8.025243759155273, -7.315077304840088, -6.604910850524902, -5.894744873046875, -5.1845784187316895, -4.474411964416504, -3.7642459869384766, -3.054079532623291, -2.3439133167266846, -1.6337469816207886, -0.9235806465148926, -0.21341443061828613, 0.4967517852783203, 1.2069182395935059, 1.9170842170715332, 2.6272506713867188, 3.337416887283325, 4.047583103179932, 4.757749557495117, 5.4679155349731445, 6.17808198928833, 6.888248443603516, 7.598414421081543, 8.30858039855957, 9.018746376037598, 9.728913307189941, 10.439079284667969, 11.149245262145996, 11.859411239624023, 12.569578170776367, 13.279744148254395, 13.989912033081055, 14.700078010559082, 15.410244941711426, 16.120410919189453, 16.830577850341797, 17.540742874145508, 18.25090980529785, 18.961074829101562, 19.671241760253906, 20.38140869140625, 21.09157371520996, 21.801740646362305, 22.51190757751465, 23.22207260131836, 23.932239532470703, 24.642406463623047, 25.35257339477539, 26.062740325927734, 26.772905349731445, 27.48307228088379, 28.193239212036133, 28.903404235839844, 29.613571166992188, 30.32373809814453, 31.033903121948242, 31.744070053100586, 32.4542350769043, 33.16440200805664, 33.874568939208984, 34.58473587036133, 35.294898986816406, 36.00506591796875, 36.715232849121094]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 6.0, 8.0, 8.0, 11.0, 14.0, 18.0, 22.0, 17.0, 26.0, 40.0, 36.0, 40.0, 37.0, 43.0, 54.0, 46.0, 67.0, 49.0, 51.0, 58.0, 32.0, 44.0, 33.0, 37.0, 38.0, 25.0, 21.0, 18.0, 27.0, 16.0, 12.0, 8.0, 10.0, 10.0, 6.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.277040481567383, -14.789501190185547, -14.301960945129395, -13.814421653747559, -13.326882362365723, -12.83934211730957, -12.351802825927734, -11.864263534545898, -11.376724243164062, -10.889184951782227, -10.401644706726074, -9.914105415344238, -9.426566123962402, -8.93902587890625, -8.451486587524414, -7.963947296142578, -7.476407051086426, -6.988867282867432, -6.501327991485596, -6.013788223266602, -5.526248931884766, -5.0387091636657715, -4.551169395446777, -4.063630104064941, -3.5760903358459473, -3.0885508060455322, -2.601011276245117, -2.113471508026123, -1.625931978225708, -1.138392448425293, -0.6508526802062988, -0.1633131504058838, 0.32422637939453125, 0.8117659687995911, 1.2993055582046509, 1.7868452072143555, 2.2743847370147705, 2.7619242668151855, 3.2494640350341797, 3.7370035648345947, 4.22454309463501, 4.712082862854004, 5.19962215423584, 5.687161922454834, 6.174701690673828, 6.662240982055664, 7.149780750274658, 7.637320518493652, 8.124859809875488, 8.612399101257324, 9.099939346313477, 9.587478637695312, 10.075017929077148, 10.562557220458984, 11.050097465515137, 11.537636756896973, 12.025177001953125, 12.512716293334961, 13.000256538391113, 13.48779582977295, 13.975335121154785, 14.462875366210938, 14.950414657592773, 15.43795394897461, 15.925493240356445]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 6.0, 13.0, 30.0, 37.0, 78.0, 152.0, 248.0, 471.0, 1004.0, 2295.0, 5781.0, 17387.0, 78353.0, 3642020.0, 390962.0, 36543.0, 10546.0, 4050.0, 1855.0, 878.0, 546.0, 320.0, 194.0, 141.0, 91.0, 59.0, 47.0, 34.0, 28.0, 27.0, 19.0, 5.0, 14.0, 10.0, 5.0, 4.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.755859375, -1.67138671875, -1.5869140625, -1.50244140625, -1.41796875, -1.33349609375, -1.2490234375, -1.16455078125, -1.080078125, -0.99560546875, -0.9111328125, -0.82666015625, -0.7421875, -0.65771484375, -0.5732421875, -0.48876953125, -0.404296875, -0.31982421875, -0.2353515625, -0.15087890625, -0.06640625, 0.01806640625, 0.1025390625, 0.18701171875, 0.271484375, 0.35595703125, 0.4404296875, 0.52490234375, 0.609375, 0.69384765625, 0.7783203125, 0.86279296875, 0.947265625, 1.03173828125, 1.1162109375, 1.20068359375, 1.28515625, 1.36962890625, 1.4541015625, 1.53857421875, 1.623046875, 1.70751953125, 1.7919921875, 1.87646484375, 1.9609375, 2.04541015625, 2.1298828125, 2.21435546875, 2.298828125, 2.38330078125, 2.4677734375, 2.55224609375, 2.63671875, 2.72119140625, 2.8056640625, 2.89013671875, 2.974609375, 3.05908203125, 3.1435546875, 3.22802734375, 3.3125, 3.39697265625, 3.4814453125, 3.56591796875, 3.650390625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 0.0, 1.0, 6.0, 3.0, 7.0, 11.0, 9.0, 19.0, 24.0, 33.0, 41.0, 61.0, 62.0, 77.0, 100.0, 85.0, 78.0, 82.0, 54.0, 65.0, 54.0, 37.0, 30.0, 15.0, 23.0, 12.0, 6.0, 5.0, 4.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50390625, -0.4771728515625, -0.450439453125, -0.4237060546875, -0.39697265625, -0.3702392578125, -0.343505859375, -0.3167724609375, -0.2900390625, -0.2633056640625, -0.236572265625, -0.2098388671875, -0.18310546875, -0.1563720703125, -0.129638671875, -0.1029052734375, -0.076171875, -0.0494384765625, -0.022705078125, 0.0040283203125, 0.03076171875, 0.0574951171875, 0.084228515625, 0.1109619140625, 0.1376953125, 0.1644287109375, 0.191162109375, 0.2178955078125, 0.24462890625, 0.2713623046875, 0.298095703125, 0.3248291015625, 0.3515625, 0.3782958984375, 0.405029296875, 0.4317626953125, 0.45849609375, 0.4852294921875, 0.511962890625, 0.5386962890625, 0.5654296875, 0.5921630859375, 0.618896484375, 0.6456298828125, 0.67236328125, 0.6990966796875, 0.725830078125, 0.7525634765625, 0.779296875, 0.8060302734375, 0.832763671875, 0.8594970703125, 0.88623046875, 0.9129638671875, 0.939697265625, 0.9664306640625, 0.9931640625, 1.0198974609375, 1.046630859375, 1.0733642578125, 1.10009765625, 1.1268310546875, 1.153564453125, 1.1802978515625, 1.20703125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 2.0, 6.0, 3.0, 2.0, 8.0, 10.0, 14.0, 24.0, 38.0, 65.0, 74.0, 168.0, 280.0, 550.0, 1210.0, 3182.0, 10659.0, 50928.0, 1925673.0, 2136320.0, 49685.0, 9949.0, 2946.0, 1207.0, 510.0, 271.0, 170.0, 118.0, 80.0, 35.0, 33.0, 21.0, 17.0, 10.0, 7.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2421875, -2.164886474609375, -2.08758544921875, -2.010284423828125, -1.9329833984375, -1.855682373046875, -1.77838134765625, -1.701080322265625, -1.623779296875, -1.546478271484375, -1.46917724609375, -1.391876220703125, -1.3145751953125, -1.237274169921875, -1.15997314453125, -1.082672119140625, -1.00537109375, -0.928070068359375, -0.85076904296875, -0.773468017578125, -0.6961669921875, -0.618865966796875, -0.54156494140625, -0.464263916015625, -0.386962890625, -0.309661865234375, -0.23236083984375, -0.155059814453125, -0.0777587890625, -0.000457763671875, 0.07684326171875, 0.154144287109375, 0.2314453125, 0.308746337890625, 0.38604736328125, 0.463348388671875, 0.5406494140625, 0.617950439453125, 0.69525146484375, 0.772552490234375, 0.849853515625, 0.927154541015625, 1.00445556640625, 1.081756591796875, 1.1590576171875, 1.236358642578125, 1.31365966796875, 1.390960693359375, 1.46826171875, 1.545562744140625, 1.62286376953125, 1.700164794921875, 1.7774658203125, 1.854766845703125, 1.93206787109375, 2.009368896484375, 2.086669921875, 2.163970947265625, 2.24127197265625, 2.318572998046875, 2.3958740234375, 2.473175048828125, 2.55047607421875, 2.627777099609375, 2.705078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 3.0, 4.0, 6.0, 10.0, 7.0, 8.0, 18.0, 15.0, 40.0, 38.0, 71.0, 127.0, 281.0, 948.0, 1670.0, 414.0, 192.0, 86.0, 52.0, 30.0, 18.0, 11.0, 6.0, 6.0, 5.0, 5.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.7685546875, -0.7460708618164062, -0.7235870361328125, -0.7011032104492188, -0.678619384765625, -0.6561355590820312, -0.6336517333984375, -0.6111679077148438, -0.58868408203125, -0.5662002563476562, -0.5437164306640625, -0.5212326049804688, -0.498748779296875, -0.47626495361328125, -0.4537811279296875, -0.43129730224609375, -0.4088134765625, -0.38632965087890625, -0.3638458251953125, -0.34136199951171875, -0.318878173828125, -0.29639434814453125, -0.2739105224609375, -0.25142669677734375, -0.22894287109375, -0.20645904541015625, -0.1839752197265625, -0.16149139404296875, -0.139007568359375, -0.11652374267578125, -0.0940399169921875, -0.07155609130859375, -0.049072265625, -0.02658843994140625, -0.0041046142578125, 0.01837921142578125, 0.040863037109375, 0.06334686279296875, 0.0858306884765625, 0.10831451416015625, 0.13079833984375, 0.15328216552734375, 0.1757659912109375, 0.19824981689453125, 0.220733642578125, 0.24321746826171875, 0.2657012939453125, 0.28818511962890625, 0.3106689453125, 0.33315277099609375, 0.3556365966796875, 0.37812042236328125, 0.400604248046875, 0.42308807373046875, 0.4455718994140625, 0.46805572509765625, 0.49053955078125, 0.5130233764648438, 0.5355072021484375, 0.5579910278320312, 0.580474853515625, 0.6029586791992188, 0.6254425048828125, 0.6479263305664062, 0.67041015625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 9.0, 42.0, 143.0, 331.0, 321.0, 107.0, 38.0, 9.0, 0.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-11.956747055053711, -11.722601890563965, -11.488455772399902, -11.254310607910156, -11.020164489746094, -10.786019325256348, -10.551874160766602, -10.317728042602539, -10.083582878112793, -9.849437713623047, -9.615291595458984, -9.381146430969238, -9.147000312805176, -8.91285514831543, -8.678709983825684, -8.444563865661621, -8.210418701171875, -7.976273059844971, -7.742127418518066, -7.50798225402832, -7.273836612701416, -7.039690971374512, -6.805545330047607, -6.571399688720703, -6.337254047393799, -6.1031084060668945, -5.86896276473999, -5.634817600250244, -5.40067195892334, -5.1665263175964355, -4.932380676269531, -4.698235511779785, -4.464090347290039, -4.229944705963135, -3.9957993030548096, -3.7616536617279053, -3.52750825881958, -3.293362617492676, -3.0592169761657715, -2.8250715732574463, -2.590925693511963, -2.3567800521850586, -2.1226346492767334, -1.888489007949829, -1.654343605041504, -1.4201979637145996, -1.1860524415969849, -0.9519069194793701, -0.7177615165710449, -0.4836159944534302, -0.24947044253349304, -0.015324890613555908, 0.21882063150405884, 0.45296621322631836, 0.6871117353439331, 0.9212572574615479, 1.1554027795791626, 1.3895483016967773, 1.623693823814392, 1.8578393459320068, 2.091984987258911, 2.3261303901672363, 2.5602760314941406, 2.794421672821045, 3.02856707572937]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 11.0, 11.0, 8.0, 10.0, 16.0, 16.0, 17.0, 29.0, 25.0, 19.0, 34.0, 31.0, 33.0, 34.0, 52.0, 50.0, 52.0, 50.0, 48.0, 43.0, 43.0, 48.0, 46.0, 36.0, 37.0, 38.0, 35.0, 26.0, 16.0, 22.0, 12.0, 7.0, 13.0, 7.0, 10.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.4083962440490723, -2.3434433937072754, -2.2784907817840576, -2.2135379314422607, -2.148585081100464, -2.083632469177246, -2.018679618835449, -1.9537267684936523, -1.888774037361145, -1.8238213062286377, -1.7588684558868408, -1.6939157247543335, -1.6289629936218262, -1.5640101432800293, -1.499057412147522, -1.4341046810150146, -1.3691518306732178, -1.3041990995407104, -1.2392462491989136, -1.1742935180664062, -1.1093406677246094, -1.044387936592102, -0.9794352054595947, -0.9144824147224426, -0.8495296239852905, -0.7845768332481384, -0.7196240425109863, -0.654671311378479, -0.5897185206413269, -0.5247657299041748, -0.4598129689693451, -0.3948602080345154, -0.3299071788787842, -0.2649543881416321, -0.20000162720680237, -0.13504885137081146, -0.07009607553482056, -0.005143284797668457, 0.059809476137161255, 0.12476223707199097, 0.18971502780914307, 0.25466781854629517, 0.3196205794811249, 0.3845733404159546, 0.4495261311531067, 0.5144789218902588, 0.5794316530227661, 0.6443844437599182, 0.7093372344970703, 0.7742900252342224, 0.8392428159713745, 0.9041955471038818, 0.9691483378410339, 1.034101128578186, 1.0990538597106934, 1.1640067100524902, 1.2289594411849976, 1.2939121723175049, 1.3588650226593018, 1.423817753791809, 1.4887704849243164, 1.5537233352661133, 1.6186760663986206, 1.683628797531128, 1.7485816478729248]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 7.0, 6.0, 16.0, 14.0, 35.0, 33.0, 45.0, 56.0, 108.0, 167.0, 262.0, 525.0, 1115.0, 2543.0, 6884.0, 22222.0, 91198.0, 430636.0, 383873.0, 78284.0, 19767.0, 6146.0, 2322.0, 1076.0, 457.0, 270.0, 165.0, 90.0, 78.0, 42.0, 26.0, 25.0, 11.0, 14.0, 10.0, 7.0, 9.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.177734375, -2.099822998046875, -2.02191162109375, -1.944000244140625, -1.8660888671875, -1.788177490234375, -1.71026611328125, -1.632354736328125, -1.554443359375, -1.476531982421875, -1.39862060546875, -1.320709228515625, -1.2427978515625, -1.164886474609375, -1.08697509765625, -1.009063720703125, -0.93115234375, -0.853240966796875, -0.77532958984375, -0.697418212890625, -0.6195068359375, -0.541595458984375, -0.46368408203125, -0.385772705078125, -0.307861328125, -0.229949951171875, -0.15203857421875, -0.074127197265625, 0.0037841796875, 0.081695556640625, 0.15960693359375, 0.237518310546875, 0.3154296875, 0.393341064453125, 0.47125244140625, 0.549163818359375, 0.6270751953125, 0.704986572265625, 0.78289794921875, 0.860809326171875, 0.938720703125, 1.016632080078125, 1.09454345703125, 1.172454833984375, 1.2503662109375, 1.328277587890625, 1.40618896484375, 1.484100341796875, 1.56201171875, 1.639923095703125, 1.71783447265625, 1.795745849609375, 1.8736572265625, 1.951568603515625, 2.02947998046875, 2.107391357421875, 2.185302734375, 2.263214111328125, 2.34112548828125, 2.419036865234375, 2.4969482421875, 2.574859619140625, 2.65277099609375, 2.730682373046875, 2.80859375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 3.0, 5.0, 14.0, 13.0, 25.0, 29.0, 38.0, 57.0, 54.0, 77.0, 100.0, 88.0, 87.0, 76.0, 59.0, 64.0, 56.0, 43.0, 37.0, 22.0, 20.0, 12.0, 5.0, 6.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.51318359375, -0.48638153076171875, -0.4595794677734375, -0.43277740478515625, -0.405975341796875, -0.37917327880859375, -0.3523712158203125, -0.32556915283203125, -0.29876708984375, -0.27196502685546875, -0.2451629638671875, -0.21836090087890625, -0.191558837890625, -0.16475677490234375, -0.1379547119140625, -0.11115264892578125, -0.0843505859375, -0.05754852294921875, -0.0307464599609375, -0.00394439697265625, 0.022857666015625, 0.04965972900390625, 0.0764617919921875, 0.10326385498046875, 0.13006591796875, 0.15686798095703125, 0.1836700439453125, 0.21047210693359375, 0.237274169921875, 0.26407623291015625, 0.2908782958984375, 0.31768035888671875, 0.344482421875, 0.37128448486328125, 0.3980865478515625, 0.42488861083984375, 0.451690673828125, 0.47849273681640625, 0.5052947998046875, 0.5320968627929688, 0.55889892578125, 0.5857009887695312, 0.6125030517578125, 0.6393051147460938, 0.666107177734375, 0.6929092407226562, 0.7197113037109375, 0.7465133666992188, 0.7733154296875, 0.8001174926757812, 0.8269195556640625, 0.8537216186523438, 0.880523681640625, 0.9073257446289062, 0.9341278076171875, 0.9609298706054688, 0.98773193359375, 1.0145339965820312, 1.0413360595703125, 1.0681381225585938, 1.094940185546875, 1.1217422485351562, 1.1485443115234375, 1.1753463745117188, 1.2021484375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 6.0, 1.0, 3.0, 2.0, 10.0, 13.0, 13.0, 6.0, 25.0, 22.0, 41.0, 50.0, 53.0, 95.0, 142.0, 217.0, 330.0, 482.0, 960.0, 1842.0, 3935.0, 9880.0, 29705.0, 109836.0, 394609.0, 358288.0, 95093.0, 26126.0, 9024.0, 3714.0, 1616.0, 906.0, 508.0, 291.0, 218.0, 137.0, 104.0, 68.0, 56.0, 37.0, 24.0, 19.0, 17.0, 8.0, 4.0, 6.0, 7.0, 5.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.6943359375, -1.6337127685546875, -1.573089599609375, -1.5124664306640625, -1.45184326171875, -1.3912200927734375, -1.330596923828125, -1.2699737548828125, -1.2093505859375, -1.1487274169921875, -1.088104248046875, -1.0274810791015625, -0.96685791015625, -0.9062347412109375, -0.845611572265625, -0.7849884033203125, -0.724365234375, -0.6637420654296875, -0.603118896484375, -0.5424957275390625, -0.48187255859375, -0.4212493896484375, -0.360626220703125, -0.3000030517578125, -0.2393798828125, -0.1787567138671875, -0.118133544921875, -0.0575103759765625, 0.00311279296875, 0.0637359619140625, 0.124359130859375, 0.1849822998046875, 0.24560546875, 0.3062286376953125, 0.366851806640625, 0.4274749755859375, 0.48809814453125, 0.5487213134765625, 0.609344482421875, 0.6699676513671875, 0.7305908203125, 0.7912139892578125, 0.851837158203125, 0.9124603271484375, 0.97308349609375, 1.0337066650390625, 1.094329833984375, 1.1549530029296875, 1.215576171875, 1.2761993408203125, 1.336822509765625, 1.3974456787109375, 1.45806884765625, 1.5186920166015625, 1.579315185546875, 1.6399383544921875, 1.7005615234375, 1.7611846923828125, 1.821807861328125, 1.8824310302734375, 1.94305419921875, 2.0036773681640625, 2.064300537109375, 2.1249237060546875, 2.185546875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 7.0, 6.0, 6.0, 5.0, 18.0, 15.0, 21.0, 20.0, 28.0, 32.0, 31.0, 52.0, 45.0, 51.0, 51.0, 71.0, 50.0, 47.0, 49.0, 42.0, 46.0, 33.0, 40.0, 34.0, 31.0, 30.0, 31.0, 21.0, 15.0, 15.0, 10.0, 8.0, 13.0, 8.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16796875, -2.08709716796875, -2.0062255859375, -1.92535400390625, -1.844482421875, -1.76361083984375, -1.6827392578125, -1.60186767578125, -1.52099609375, -1.44012451171875, -1.3592529296875, -1.27838134765625, -1.197509765625, -1.11663818359375, -1.0357666015625, -0.95489501953125, -0.8740234375, -0.79315185546875, -0.7122802734375, -0.63140869140625, -0.550537109375, -0.46966552734375, -0.3887939453125, -0.30792236328125, -0.22705078125, -0.14617919921875, -0.0653076171875, 0.01556396484375, 0.096435546875, 0.17730712890625, 0.2581787109375, 0.33905029296875, 0.419921875, 0.50079345703125, 0.5816650390625, 0.66253662109375, 0.743408203125, 0.82427978515625, 0.9051513671875, 0.98602294921875, 1.06689453125, 1.14776611328125, 1.2286376953125, 1.30950927734375, 1.390380859375, 1.47125244140625, 1.5521240234375, 1.63299560546875, 1.7138671875, 1.79473876953125, 1.8756103515625, 1.95648193359375, 2.037353515625, 2.11822509765625, 2.1990966796875, 2.27996826171875, 2.36083984375, 2.44171142578125, 2.5225830078125, 2.60345458984375, 2.684326171875, 2.76519775390625, 2.8460693359375, 2.92694091796875, 3.0078125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 7.0, 9.0, 17.0, 28.0, 31.0, 47.0, 71.0, 145.0, 290.0, 715.0, 2252.0, 9722.0, 66235.0, 524935.0, 388703.0, 45259.0, 7049.0, 1773.0, 612.0, 283.0, 142.0, 85.0, 41.0, 38.0, 15.0, 13.0, 12.0, 7.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75390625, -0.7295150756835938, -0.7051239013671875, -0.6807327270507812, -0.656341552734375, -0.6319503784179688, -0.6075592041015625, -0.5831680297851562, -0.55877685546875, -0.5343856811523438, -0.5099945068359375, -0.48560333251953125, -0.461212158203125, -0.43682098388671875, -0.4124298095703125, -0.38803863525390625, -0.3636474609375, -0.33925628662109375, -0.3148651123046875, -0.29047393798828125, -0.266082763671875, -0.24169158935546875, -0.2173004150390625, -0.19290924072265625, -0.16851806640625, -0.14412689208984375, -0.1197357177734375, -0.09534454345703125, -0.070953369140625, -0.04656219482421875, -0.0221710205078125, 0.00222015380859375, 0.026611328125, 0.05100250244140625, 0.0753936767578125, 0.09978485107421875, 0.124176025390625, 0.14856719970703125, 0.1729583740234375, 0.19734954833984375, 0.22174072265625, 0.24613189697265625, 0.2705230712890625, 0.29491424560546875, 0.319305419921875, 0.34369659423828125, 0.3680877685546875, 0.39247894287109375, 0.4168701171875, 0.44126129150390625, 0.4656524658203125, 0.49004364013671875, 0.514434814453125, 0.5388259887695312, 0.5632171630859375, 0.5876083374023438, 0.61199951171875, 0.6363906860351562, 0.6607818603515625, 0.6851730346679688, 0.709564208984375, 0.7339553833007812, 0.7583465576171875, 0.7827377319335938, 0.80712890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 0.0, 5.0, 2.0, 4.0, 4.0, 9.0, 3.0, 9.0, 7.0, 13.0, 11.0, 19.0, 23.0, 25.0, 35.0, 46.0, 47.0, 74.0, 75.0, 108.0, 95.0, 72.0, 71.0, 43.0, 39.0, 27.0, 29.0, 23.0, 21.0, 10.0, 9.0, 5.0, 5.0, 9.0, 5.0, 6.0, 4.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00012099742889404297, -0.00011753290891647339, -0.00011406838893890381, -0.00011060386896133423, -0.00010713934898376465, -0.00010367482900619507, -0.00010021030902862549, -9.674578905105591e-05, -9.328126907348633e-05, -8.981674909591675e-05, -8.635222911834717e-05, -8.288770914077759e-05, -7.942318916320801e-05, -7.595866918563843e-05, -7.249414920806885e-05, -6.902962923049927e-05, -6.556510925292969e-05, -6.210058927536011e-05, -5.863606929779053e-05, -5.517154932022095e-05, -5.170702934265137e-05, -4.824250936508179e-05, -4.477798938751221e-05, -4.131346940994263e-05, -3.784894943237305e-05, -3.438442945480347e-05, -3.091990947723389e-05, -2.7455389499664307e-05, -2.3990869522094727e-05, -2.0526349544525146e-05, -1.7061829566955566e-05, -1.3597309589385986e-05, -1.0132789611816406e-05, -6.668269634246826e-06, -3.203749656677246e-06, 2.60770320892334e-07, 3.725290298461914e-06, 7.189810276031494e-06, 1.0654330253601074e-05, 1.4118850231170654e-05, 1.7583370208740234e-05, 2.1047890186309814e-05, 2.4512410163879395e-05, 2.7976930141448975e-05, 3.1441450119018555e-05, 3.4905970096588135e-05, 3.8370490074157715e-05, 4.1835010051727295e-05, 4.5299530029296875e-05, 4.8764050006866455e-05, 5.2228569984436035e-05, 5.5693089962005615e-05, 5.9157609939575195e-05, 6.262212991714478e-05, 6.608664989471436e-05, 6.955116987228394e-05, 7.301568984985352e-05, 7.64802098274231e-05, 7.994472980499268e-05, 8.340924978256226e-05, 8.687376976013184e-05, 9.033828973770142e-05, 9.3802809715271e-05, 9.726732969284058e-05, 0.00010073184967041016]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 6.0, 5.0, 9.0, 12.0, 23.0, 30.0, 45.0, 81.0, 85.0, 182.0, 303.0, 559.0, 1131.0, 2612.0, 7115.0, 25471.0, 122801.0, 555119.0, 265674.0, 47908.0, 12135.0, 3851.0, 1613.0, 753.0, 411.0, 238.0, 130.0, 89.0, 44.0, 35.0, 18.0, 24.0, 9.0, 10.0, 7.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59521484375, -0.575836181640625, -0.55645751953125, -0.537078857421875, -0.5177001953125, -0.498321533203125, -0.47894287109375, -0.459564208984375, -0.440185546875, -0.420806884765625, -0.40142822265625, -0.382049560546875, -0.3626708984375, -0.343292236328125, -0.32391357421875, -0.304534912109375, -0.28515625, -0.265777587890625, -0.24639892578125, -0.227020263671875, -0.2076416015625, -0.188262939453125, -0.16888427734375, -0.149505615234375, -0.130126953125, -0.110748291015625, -0.09136962890625, -0.071990966796875, -0.0526123046875, -0.033233642578125, -0.01385498046875, 0.005523681640625, 0.02490234375, 0.044281005859375, 0.06365966796875, 0.083038330078125, 0.1024169921875, 0.121795654296875, 0.14117431640625, 0.160552978515625, 0.179931640625, 0.199310302734375, 0.21868896484375, 0.238067626953125, 0.2574462890625, 0.276824951171875, 0.29620361328125, 0.315582275390625, 0.3349609375, 0.354339599609375, 0.37371826171875, 0.393096923828125, 0.4124755859375, 0.431854248046875, 0.45123291015625, 0.470611572265625, 0.489990234375, 0.509368896484375, 0.52874755859375, 0.548126220703125, 0.5675048828125, 0.586883544921875, 0.60626220703125, 0.625640869140625, 0.64501953125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 4.0, 1.0, 4.0, 6.0, 11.0, 8.0, 14.0, 13.0, 24.0, 27.0, 34.0, 50.0, 54.0, 91.0, 85.0, 80.0, 121.0, 88.0, 69.0, 68.0, 39.0, 25.0, 23.0, 16.0, 12.0, 9.0, 6.0, 8.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.459228515625, -0.4412803649902344, -0.42333221435546875, -0.4053840637207031, -0.3874359130859375, -0.3694877624511719, -0.35153961181640625, -0.3335914611816406, -0.315643310546875, -0.2976951599121094, -0.27974700927734375, -0.2617988586425781, -0.2438507080078125, -0.22590255737304688, -0.20795440673828125, -0.19000625610351562, -0.17205810546875, -0.15410995483398438, -0.13616180419921875, -0.11821365356445312, -0.1002655029296875, -0.08231735229492188, -0.06436920166015625, -0.046421051025390625, -0.028472900390625, -0.010524749755859375, 0.00742340087890625, 0.025371551513671875, 0.0433197021484375, 0.061267852783203125, 0.07921600341796875, 0.09716415405273438, 0.1151123046875, 0.13306045532226562, 0.15100860595703125, 0.16895675659179688, 0.1869049072265625, 0.20485305786132812, 0.22280120849609375, 0.24074935913085938, 0.258697509765625, 0.2766456604003906, 0.29459381103515625, 0.3125419616699219, 0.3304901123046875, 0.3484382629394531, 0.36638641357421875, 0.3843345642089844, 0.40228271484375, 0.4202308654785156, 0.43817901611328125, 0.4561271667480469, 0.4740753173828125, 0.4920234680175781, 0.5099716186523438, 0.5279197692871094, 0.545867919921875, 0.5638160705566406, 0.5817642211914062, 0.5997123718261719, 0.6176605224609375, 0.6356086730957031, 0.6535568237304688, 0.6715049743652344, 0.689453125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 6.0, 15.0, 17.0, 26.0, 35.0, 58.0, 77.0, 124.0, 138.0, 148.0, 120.0, 72.0, 40.0, 43.0, 13.0, 17.0, 19.0, 8.0, 7.0, 4.0, 7.0, 0.0, 5.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.742068290710449, -7.388718605041504, -7.035369396209717, -6.68202018737793, -6.328670501708984, -5.975320816040039, -5.621971607208252, -5.268622398376465, -4.9152727127075195, -4.561923027038574, -4.208573818206787, -3.855224370956421, -3.5018749237060547, -3.1485254764556885, -2.7951760292053223, -2.441826581954956, -2.08847713470459, -1.7351276874542236, -1.3817782402038574, -1.0284287929534912, -0.675079345703125, -0.3217298984527588, 0.03161954879760742, 0.38496899604797363, 0.7383184432983398, 1.091667890548706, 1.4450173377990723, 1.7983667850494385, 2.1517162322998047, 2.505065679550171, 2.858415126800537, 3.2117645740509033, 3.565114974975586, 3.918464422225952, 4.271813869476318, 4.6251630783081055, 4.978512763977051, 5.331862449645996, 5.685211658477783, 6.03856086730957, 6.391910552978516, 6.745260238647461, 7.098609447479248, 7.451958656311035, 7.8053083419799805, 8.158658027648926, 8.512006759643555, 8.8653564453125, 9.218706130981445, 9.57205581665039, 9.925405502319336, 10.278754234313965, 10.63210391998291, 10.985453605651855, 11.338802337646484, 11.69215202331543, 12.045501708984375, 12.39885139465332, 12.752201080322266, 13.105549812316895, 13.45889949798584, 13.812249183654785, 14.165597915649414, 14.51894760131836, 14.872297286987305]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 1.0, 5.0, 4.0, 3.0, 9.0, 2.0, 11.0, 10.0, 19.0, 17.0, 23.0, 22.0, 27.0, 31.0, 25.0, 38.0, 33.0, 46.0, 43.0, 42.0, 49.0, 42.0, 46.0, 41.0, 46.0, 50.0, 48.0, 34.0, 42.0, 30.0, 24.0, 28.0, 20.0, 18.0, 15.0, 14.0, 7.0, 13.0, 5.0, 8.0, 2.0, 1.0, 3.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.300506591796875, -11.913490295410156, -11.526474952697754, -11.139458656311035, -10.752442359924316, -10.365427017211914, -9.978410720825195, -9.591394424438477, -9.204378128051758, -8.817361831665039, -8.430346488952637, -8.043330192565918, -7.656313896179199, -7.269298076629639, -6.882282257080078, -6.495265960693359, -6.108250617980957, -5.7212347984313965, -5.334218502044678, -4.947202682495117, -4.560186386108398, -4.173170566558838, -3.7861547470092773, -3.3991386890411377, -3.012122631072998, -2.6251065731048584, -2.2380905151367188, -1.8510746955871582, -1.4640586376190186, -1.077042579650879, -0.6900267601013184, -0.3030107021331787, 0.08400535583496094, 0.4710213541984558, 0.8580373525619507, 1.2450532913208008, 1.6320693492889404, 2.01908540725708, 2.4061012268066406, 2.7931172847747803, 3.18013334274292, 3.5671494007110596, 3.954165458679199, 4.34118127822876, 4.72819709777832, 5.115213394165039, 5.5022292137146, 5.88924503326416, 6.276261329650879, 6.6632771492004395, 7.050293445587158, 7.437309265136719, 7.8243255615234375, 8.211341857910156, 8.598357200622559, 8.985373497009277, 9.37238883972168, 9.759405136108398, 10.1464204788208, 10.53343677520752, 10.920453071594238, 11.30746841430664, 11.69448471069336, 12.081501007080078, 12.468517303466797]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 5.0, 10.0, 9.0, 13.0, 10.0, 20.0, 63.0, 65.0, 118.0, 215.0, 391.0, 745.0, 1635.0, 4730.0, 17395.0, 120874.0, 3843070.0, 173561.0, 21035.0, 5614.0, 2123.0, 1018.0, 543.0, 332.0, 218.0, 142.0, 90.0, 61.0, 45.0, 32.0, 32.0, 19.0, 12.0, 7.0, 6.0, 7.0, 3.0, 3.0, 6.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.13671875, -2.0328369140625, -1.928955078125, -1.8250732421875, -1.72119140625, -1.6173095703125, -1.513427734375, -1.4095458984375, -1.3056640625, -1.2017822265625, -1.097900390625, -0.9940185546875, -0.89013671875, -0.7862548828125, -0.682373046875, -0.5784912109375, -0.474609375, -0.3707275390625, -0.266845703125, -0.1629638671875, -0.05908203125, 0.0447998046875, 0.148681640625, 0.2525634765625, 0.3564453125, 0.4603271484375, 0.564208984375, 0.6680908203125, 0.77197265625, 0.8758544921875, 0.979736328125, 1.0836181640625, 1.1875, 1.2913818359375, 1.395263671875, 1.4991455078125, 1.60302734375, 1.7069091796875, 1.810791015625, 1.9146728515625, 2.0185546875, 2.1224365234375, 2.226318359375, 2.3302001953125, 2.43408203125, 2.5379638671875, 2.641845703125, 2.7457275390625, 2.849609375, 2.9534912109375, 3.057373046875, 3.1612548828125, 3.26513671875, 3.3690185546875, 3.472900390625, 3.5767822265625, 3.6806640625, 3.7845458984375, 3.888427734375, 3.9923095703125, 4.09619140625, 4.2000732421875, 4.303955078125, 4.4078369140625, 4.51171875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 6.0, 17.0, 21.0, 28.0, 37.0, 45.0, 55.0, 73.0, 76.0, 86.0, 80.0, 78.0, 81.0, 73.0, 67.0, 52.0, 39.0, 32.0, 17.0, 10.0, 12.0, 6.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5107421875, -0.4834747314453125, -0.456207275390625, -0.4289398193359375, -0.40167236328125, -0.3744049072265625, -0.347137451171875, -0.3198699951171875, -0.2926025390625, -0.2653350830078125, -0.238067626953125, -0.2108001708984375, -0.18353271484375, -0.1562652587890625, -0.128997802734375, -0.1017303466796875, -0.074462890625, -0.0471954345703125, -0.019927978515625, 0.0073394775390625, 0.03460693359375, 0.0618743896484375, 0.089141845703125, 0.1164093017578125, 0.1436767578125, 0.1709442138671875, 0.198211669921875, 0.2254791259765625, 0.25274658203125, 0.2800140380859375, 0.307281494140625, 0.3345489501953125, 0.36181640625, 0.3890838623046875, 0.416351318359375, 0.4436187744140625, 0.47088623046875, 0.4981536865234375, 0.525421142578125, 0.5526885986328125, 0.5799560546875, 0.6072235107421875, 0.634490966796875, 0.6617584228515625, 0.68902587890625, 0.7162933349609375, 0.743560791015625, 0.7708282470703125, 0.798095703125, 0.8253631591796875, 0.852630615234375, 0.8798980712890625, 0.90716552734375, 0.9344329833984375, 0.961700439453125, 0.9889678955078125, 1.0162353515625, 1.0435028076171875, 1.070770263671875, 1.0980377197265625, 1.12530517578125, 1.1525726318359375, 1.179840087890625, 1.2071075439453125, 1.234375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 9.0, 7.0, 12.0, 16.0, 44.0, 67.0, 138.0, 264.0, 547.0, 1376.0, 3964.0, 15595.0, 182514.0, 3881259.0, 91632.0, 11439.0, 3130.0, 1156.0, 489.0, 252.0, 138.0, 76.0, 49.0, 34.0, 14.0, 11.0, 15.0, 6.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.677734375, -2.5762939453125, -2.474853515625, -2.3734130859375, -2.27197265625, -2.1705322265625, -2.069091796875, -1.9676513671875, -1.8662109375, -1.7647705078125, -1.663330078125, -1.5618896484375, -1.46044921875, -1.3590087890625, -1.257568359375, -1.1561279296875, -1.0546875, -0.9532470703125, -0.851806640625, -0.7503662109375, -0.64892578125, -0.5474853515625, -0.446044921875, -0.3446044921875, -0.2431640625, -0.1417236328125, -0.040283203125, 0.0611572265625, 0.16259765625, 0.2640380859375, 0.365478515625, 0.4669189453125, 0.568359375, 0.6697998046875, 0.771240234375, 0.8726806640625, 0.97412109375, 1.0755615234375, 1.177001953125, 1.2784423828125, 1.3798828125, 1.4813232421875, 1.582763671875, 1.6842041015625, 1.78564453125, 1.8870849609375, 1.988525390625, 2.0899658203125, 2.19140625, 2.2928466796875, 2.394287109375, 2.4957275390625, 2.59716796875, 2.6986083984375, 2.800048828125, 2.9014892578125, 3.0029296875, 3.1043701171875, 3.205810546875, 3.3072509765625, 3.40869140625, 3.5101318359375, 3.611572265625, 3.7130126953125, 3.814453125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 2.0, 4.0, 2.0, 6.0, 8.0, 6.0, 13.0, 14.0, 20.0, 56.0, 84.0, 151.0, 421.0, 1422.0, 1106.0, 382.0, 151.0, 83.0, 38.0, 29.0, 29.0, 17.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1474609375, -1.112579345703125, -1.07769775390625, -1.042816162109375, -1.0079345703125, -0.973052978515625, -0.93817138671875, -0.903289794921875, -0.868408203125, -0.833526611328125, -0.79864501953125, -0.763763427734375, -0.7288818359375, -0.694000244140625, -0.65911865234375, -0.624237060546875, -0.58935546875, -0.554473876953125, -0.51959228515625, -0.484710693359375, -0.4498291015625, -0.414947509765625, -0.38006591796875, -0.345184326171875, -0.310302734375, -0.275421142578125, -0.24053955078125, -0.205657958984375, -0.1707763671875, -0.135894775390625, -0.10101318359375, -0.066131591796875, -0.03125, 0.003631591796875, 0.03851318359375, 0.073394775390625, 0.1082763671875, 0.143157958984375, 0.17803955078125, 0.212921142578125, 0.247802734375, 0.282684326171875, 0.31756591796875, 0.352447509765625, 0.3873291015625, 0.422210693359375, 0.45709228515625, 0.491973876953125, 0.52685546875, 0.561737060546875, 0.59661865234375, 0.631500244140625, 0.6663818359375, 0.701263427734375, 0.73614501953125, 0.771026611328125, 0.805908203125, 0.840789794921875, 0.87567138671875, 0.910552978515625, 0.9454345703125, 0.980316162109375, 1.01519775390625, 1.050079345703125, 1.0849609375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 12.0, 26.0, 66.0, 154.0, 257.0, 236.0, 130.0, 51.0, 30.0, 8.0, 8.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.319116592407227, -10.072025299072266, -9.824934959411621, -9.57784366607666, -9.330753326416016, -9.083662033081055, -8.83657169342041, -8.58948040008545, -8.342390060424805, -8.095298767089844, -7.848208427429199, -7.6011176109313965, -7.354026794433594, -7.106935977935791, -6.859845161437988, -6.612753868103027, -6.365663051605225, -6.118572235107422, -5.871481418609619, -5.624390602111816, -5.377299785614014, -5.130208969116211, -4.88311767578125, -4.6360273361206055, -4.3889360427856445, -4.141845226287842, -3.894754409790039, -3.6476635932922363, -3.4005727767944336, -3.153481960296631, -2.906390905380249, -2.6593000888824463, -2.4122095108032227, -2.16511869430542, -1.9180278778076172, -1.670936942100525, -1.4238461256027222, -1.1767553091049194, -0.9296643733978271, -0.6825735569000244, -0.4354827404022217, -0.18839189410209656, 0.058698952198028564, 0.3057898283004761, 0.5528806447982788, 0.7999714612960815, 1.0470623970031738, 1.2941532135009766, 1.5412440299987793, 1.788334846496582, 2.0354256629943848, 2.2825164794921875, 2.5296072959899902, 2.776698112487793, 3.023789167404175, 3.2708799839019775, 3.5179708003997803, 3.765061616897583, 4.012152671813965, 4.259243488311768, 4.50633430480957, 4.753425121307373, 5.000515937805176, 5.2476067543029785, 5.494697570800781]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 5.0, 6.0, 13.0, 19.0, 24.0, 29.0, 26.0, 31.0, 43.0, 53.0, 68.0, 64.0, 82.0, 74.0, 65.0, 72.0, 51.0, 55.0, 36.0, 39.0, 36.0, 27.0, 25.0, 17.0, 12.0, 12.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.977710247039795, -4.8395538330078125, -4.701396942138672, -4.5632405281066895, -4.425083637237549, -4.286927223205566, -4.148770332336426, -4.010613918304443, -3.872457265853882, -3.7343006134033203, -3.596143960952759, -3.4579873085021973, -3.319830894470215, -3.181674003601074, -3.043517589569092, -2.9053609371185303, -2.7672042846679688, -2.6290476322174072, -2.4908909797668457, -2.352734327316284, -2.2145776748657227, -2.0764212608337402, -1.9382646083831787, -1.8001079559326172, -1.6619513034820557, -1.5237946510314941, -1.3856379985809326, -1.2474814653396606, -1.1093248128890991, -0.9711681604385376, -0.8330115675926208, -0.6948549747467041, -0.5566978454589844, -0.41854122281074524, -0.2803846001625061, -0.14222797751426697, -0.004071354866027832, 0.1340852975845337, 0.27224189043045044, 0.4103984832763672, 0.5485551357269287, 0.6867117881774902, 0.824868381023407, 0.9630249738693237, 1.1011816263198853, 1.2393382787704468, 1.3774948120117188, 1.5156514644622803, 1.6538081169128418, 1.7919647693634033, 1.9301214218139648, 2.0682780742645264, 2.206434726715088, 2.3445911407470703, 2.482747793197632, 2.6209044456481934, 2.759061098098755, 2.8972177505493164, 3.035374402999878, 3.1735310554504395, 3.311687469482422, 3.4498443603515625, 3.588000774383545, 3.7261574268341064, 3.864314079284668]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 9.0, 17.0, 17.0, 22.0, 30.0, 50.0, 77.0, 169.0, 280.0, 540.0, 1257.0, 3344.0, 12624.0, 71312.0, 512575.0, 381854.0, 49748.0, 9647.0, 2771.0, 1109.0, 530.0, 237.0, 119.0, 83.0, 34.0, 31.0, 25.0, 16.0, 6.0, 8.0, 2.0, 6.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.390625, -3.28436279296875, -3.1781005859375, -3.07183837890625, -2.965576171875, -2.85931396484375, -2.7530517578125, -2.64678955078125, -2.54052734375, -2.43426513671875, -2.3280029296875, -2.22174072265625, -2.115478515625, -2.00921630859375, -1.9029541015625, -1.79669189453125, -1.6904296875, -1.58416748046875, -1.4779052734375, -1.37164306640625, -1.265380859375, -1.15911865234375, -1.0528564453125, -0.94659423828125, -0.84033203125, -0.73406982421875, -0.6278076171875, -0.52154541015625, -0.415283203125, -0.30902099609375, -0.2027587890625, -0.09649658203125, 0.009765625, 0.11602783203125, 0.2222900390625, 0.32855224609375, 0.434814453125, 0.54107666015625, 0.6473388671875, 0.75360107421875, 0.85986328125, 0.96612548828125, 1.0723876953125, 1.17864990234375, 1.284912109375, 1.39117431640625, 1.4974365234375, 1.60369873046875, 1.7099609375, 1.81622314453125, 1.9224853515625, 2.02874755859375, 2.135009765625, 2.24127197265625, 2.3475341796875, 2.45379638671875, 2.56005859375, 2.66632080078125, 2.7725830078125, 2.87884521484375, 2.985107421875, 3.09136962890625, 3.1976318359375, 3.30389404296875, 3.41015625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 5.0, 9.0, 22.0, 27.0, 38.0, 40.0, 60.0, 88.0, 99.0, 88.0, 98.0, 92.0, 84.0, 77.0, 54.0, 48.0, 24.0, 19.0, 10.0, 6.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67626953125, -0.6459884643554688, -0.6157073974609375, -0.5854263305664062, -0.555145263671875, -0.5248641967773438, -0.4945831298828125, -0.46430206298828125, -0.43402099609375, -0.40373992919921875, -0.3734588623046875, -0.34317779541015625, -0.312896728515625, -0.28261566162109375, -0.2523345947265625, -0.22205352783203125, -0.1917724609375, -0.16149139404296875, -0.1312103271484375, -0.10092926025390625, -0.070648193359375, -0.04036712646484375, -0.0100860595703125, 0.02019500732421875, 0.05047607421875, 0.08075714111328125, 0.1110382080078125, 0.14131927490234375, 0.171600341796875, 0.20188140869140625, 0.2321624755859375, 0.26244354248046875, 0.292724609375, 0.32300567626953125, 0.3532867431640625, 0.38356781005859375, 0.413848876953125, 0.44412994384765625, 0.4744110107421875, 0.5046920776367188, 0.53497314453125, 0.5652542114257812, 0.5955352783203125, 0.6258163452148438, 0.656097412109375, 0.6863784790039062, 0.7166595458984375, 0.7469406127929688, 0.7772216796875, 0.8075027465820312, 0.8377838134765625, 0.8680648803710938, 0.898345947265625, 0.9286270141601562, 0.9589080810546875, 0.9891891479492188, 1.01947021484375, 1.0497512817382812, 1.0800323486328125, 1.1103134155273438, 1.140594482421875, 1.1708755493164062, 1.2011566162109375, 1.2314376831054688, 1.26171875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 9.0, 11.0, 8.0, 11.0, 11.0, 23.0, 23.0, 31.0, 35.0, 46.0, 76.0, 107.0, 135.0, 247.0, 357.0, 667.0, 1235.0, 2445.0, 5282.0, 11264.0, 27084.0, 73655.0, 209663.0, 373134.0, 215072.0, 76287.0, 28595.0, 11763.0, 5425.0, 2635.0, 1311.0, 736.0, 408.0, 269.0, 162.0, 98.0, 65.0, 57.0, 34.0, 16.0, 20.0, 14.0, 13.0, 7.0, 6.0, 5.0, 4.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.462890625, -1.4178924560546875, -1.372894287109375, -1.3278961181640625, -1.28289794921875, -1.2378997802734375, -1.192901611328125, -1.1479034423828125, -1.1029052734375, -1.0579071044921875, -1.012908935546875, -0.9679107666015625, -0.92291259765625, -0.8779144287109375, -0.832916259765625, -0.7879180908203125, -0.742919921875, -0.6979217529296875, -0.652923583984375, -0.6079254150390625, -0.56292724609375, -0.5179290771484375, -0.472930908203125, -0.4279327392578125, -0.3829345703125, -0.3379364013671875, -0.292938232421875, -0.2479400634765625, -0.20294189453125, -0.1579437255859375, -0.112945556640625, -0.0679473876953125, -0.02294921875, 0.0220489501953125, 0.067047119140625, 0.1120452880859375, 0.15704345703125, 0.2020416259765625, 0.247039794921875, 0.2920379638671875, 0.3370361328125, 0.3820343017578125, 0.427032470703125, 0.4720306396484375, 0.51702880859375, 0.5620269775390625, 0.607025146484375, 0.6520233154296875, 0.697021484375, 0.7420196533203125, 0.787017822265625, 0.8320159912109375, 0.87701416015625, 0.9220123291015625, 0.967010498046875, 1.0120086669921875, 1.0570068359375, 1.1020050048828125, 1.147003173828125, 1.1920013427734375, 1.23699951171875, 1.2819976806640625, 1.326995849609375, 1.3719940185546875, 1.4169921875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 7.0, 5.0, 7.0, 4.0, 13.0, 16.0, 9.0, 15.0, 7.0, 15.0, 22.0, 24.0, 26.0, 35.0, 42.0, 34.0, 30.0, 30.0, 35.0, 35.0, 38.0, 30.0, 41.0, 40.0, 46.0, 39.0, 42.0, 40.0, 24.0, 29.0, 35.0, 24.0, 28.0, 15.0, 21.0, 17.0, 20.0, 8.0, 13.0, 11.0, 4.0, 7.0, 6.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.009765625, -1.946563720703125, -1.88336181640625, -1.820159912109375, -1.7569580078125, -1.693756103515625, -1.63055419921875, -1.567352294921875, -1.504150390625, -1.440948486328125, -1.37774658203125, -1.314544677734375, -1.2513427734375, -1.188140869140625, -1.12493896484375, -1.061737060546875, -0.99853515625, -0.935333251953125, -0.87213134765625, -0.808929443359375, -0.7457275390625, -0.682525634765625, -0.61932373046875, -0.556121826171875, -0.492919921875, -0.429718017578125, -0.36651611328125, -0.303314208984375, -0.2401123046875, -0.176910400390625, -0.11370849609375, -0.050506591796875, 0.0126953125, 0.075897216796875, 0.13909912109375, 0.202301025390625, 0.2655029296875, 0.328704833984375, 0.39190673828125, 0.455108642578125, 0.518310546875, 0.581512451171875, 0.64471435546875, 0.707916259765625, 0.7711181640625, 0.834320068359375, 0.89752197265625, 0.960723876953125, 1.02392578125, 1.087127685546875, 1.15032958984375, 1.213531494140625, 1.2767333984375, 1.339935302734375, 1.40313720703125, 1.466339111328125, 1.529541015625, 1.592742919921875, 1.65594482421875, 1.719146728515625, 1.7823486328125, 1.845550537109375, 1.90875244140625, 1.971954345703125, 2.03515625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 3.0, 6.0, 18.0, 26.0, 34.0, 76.0, 167.0, 424.0, 1688.0, 14911.0, 666951.0, 353360.0, 9021.0, 1235.0, 317.0, 152.0, 66.0, 45.0, 14.0, 13.0, 6.0, 7.0, 2.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7109375, -1.657318115234375, -1.60369873046875, -1.550079345703125, -1.4964599609375, -1.442840576171875, -1.38922119140625, -1.335601806640625, -1.281982421875, -1.228363037109375, -1.17474365234375, -1.121124267578125, -1.0675048828125, -1.013885498046875, -0.96026611328125, -0.906646728515625, -0.85302734375, -0.799407958984375, -0.74578857421875, -0.692169189453125, -0.6385498046875, -0.584930419921875, -0.53131103515625, -0.477691650390625, -0.424072265625, -0.370452880859375, -0.31683349609375, -0.263214111328125, -0.2095947265625, -0.155975341796875, -0.10235595703125, -0.048736572265625, 0.0048828125, 0.058502197265625, 0.11212158203125, 0.165740966796875, 0.2193603515625, 0.272979736328125, 0.32659912109375, 0.380218505859375, 0.433837890625, 0.487457275390625, 0.54107666015625, 0.594696044921875, 0.6483154296875, 0.701934814453125, 0.75555419921875, 0.809173583984375, 0.86279296875, 0.916412353515625, 0.97003173828125, 1.023651123046875, 1.0772705078125, 1.130889892578125, 1.18450927734375, 1.238128662109375, 1.291748046875, 1.345367431640625, 1.39898681640625, 1.452606201171875, 1.5062255859375, 1.559844970703125, 1.61346435546875, 1.667083740234375, 1.720703125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 7.0, 7.0, 9.0, 6.0, 16.0, 12.0, 16.0, 11.0, 18.0, 27.0, 33.0, 48.0, 48.0, 49.0, 74.0, 70.0, 88.0, 87.0, 60.0, 56.0, 43.0, 38.0, 28.0, 17.0, 12.0, 13.0, 16.0, 10.0, 11.0, 10.0, 4.0, 9.0, 6.0, 7.0, 3.0, 6.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 4.0], "bins": [-0.00010514259338378906, -0.00010230671614408493, -9.94708389043808e-05, -9.663496166467667e-05, -9.379908442497253e-05, -9.09632071852684e-05, -8.812732994556427e-05, -8.529145270586014e-05, -8.2455575466156e-05, -7.961969822645187e-05, -7.678382098674774e-05, -7.394794374704361e-05, -7.111206650733948e-05, -6.827618926763535e-05, -6.544031202793121e-05, -6.260443478822708e-05, -5.976855754852295e-05, -5.693268030881882e-05, -5.4096803069114685e-05, -5.126092582941055e-05, -4.842504858970642e-05, -4.558917135000229e-05, -4.275329411029816e-05, -3.9917416870594025e-05, -3.708153963088989e-05, -3.424566239118576e-05, -3.140978515148163e-05, -2.8573907911777496e-05, -2.5738030672073364e-05, -2.2902153432369232e-05, -2.00662761926651e-05, -1.7230398952960968e-05, -1.4394521713256836e-05, -1.1558644473552704e-05, -8.722767233848572e-06, -5.88688999414444e-06, -3.0510127544403076e-06, -2.1513551473617554e-07, 2.6207417249679565e-06, 5.456618964672089e-06, 8.29249620437622e-06, 1.1128373444080353e-05, 1.3964250683784485e-05, 1.6800127923488617e-05, 1.963600516319275e-05, 2.247188240289688e-05, 2.5307759642601013e-05, 2.8143636882305145e-05, 3.097951412200928e-05, 3.381539136171341e-05, 3.665126860141754e-05, 3.9487145841121674e-05, 4.2323023080825806e-05, 4.515890032052994e-05, 4.799477756023407e-05, 5.08306547999382e-05, 5.3666532039642334e-05, 5.6502409279346466e-05, 5.93382865190506e-05, 6.217416375875473e-05, 6.501004099845886e-05, 6.7845918238163e-05, 7.068179547786713e-05, 7.351767271757126e-05, 7.635354995727539e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 3.0, 8.0, 1.0, 6.0, 2.0, 17.0, 12.0, 24.0, 34.0, 68.0, 103.0, 188.0, 348.0, 712.0, 1600.0, 4393.0, 20213.0, 204289.0, 714753.0, 85384.0, 11061.0, 2994.0, 1157.0, 527.0, 270.0, 153.0, 76.0, 54.0, 34.0, 18.0, 18.0, 11.0, 5.0, 4.0, 2.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.052734375, -1.021148681640625, -0.98956298828125, -0.957977294921875, -0.9263916015625, -0.894805908203125, -0.86322021484375, -0.831634521484375, -0.800048828125, -0.768463134765625, -0.73687744140625, -0.705291748046875, -0.6737060546875, -0.642120361328125, -0.61053466796875, -0.578948974609375, -0.54736328125, -0.515777587890625, -0.48419189453125, -0.452606201171875, -0.4210205078125, -0.389434814453125, -0.35784912109375, -0.326263427734375, -0.294677734375, -0.263092041015625, -0.23150634765625, -0.199920654296875, -0.1683349609375, -0.136749267578125, -0.10516357421875, -0.073577880859375, -0.0419921875, -0.010406494140625, 0.02117919921875, 0.052764892578125, 0.0843505859375, 0.115936279296875, 0.14752197265625, 0.179107666015625, 0.210693359375, 0.242279052734375, 0.27386474609375, 0.305450439453125, 0.3370361328125, 0.368621826171875, 0.40020751953125, 0.431793212890625, 0.46337890625, 0.494964599609375, 0.52655029296875, 0.558135986328125, 0.5897216796875, 0.621307373046875, 0.65289306640625, 0.684478759765625, 0.716064453125, 0.747650146484375, 0.77923583984375, 0.810821533203125, 0.8424072265625, 0.873992919921875, 0.90557861328125, 0.937164306640625, 0.96875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 8.0, 8.0, 16.0, 29.0, 51.0, 89.0, 150.0, 152.0, 184.0, 118.0, 83.0, 38.0, 37.0, 15.0, 3.0, 5.0, 5.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0771484375, -1.0409698486328125, -1.004791259765625, -0.9686126708984375, -0.93243408203125, -0.8962554931640625, -0.860076904296875, -0.8238983154296875, -0.7877197265625, -0.7515411376953125, -0.715362548828125, -0.6791839599609375, -0.64300537109375, -0.6068267822265625, -0.570648193359375, -0.5344696044921875, -0.498291015625, -0.4621124267578125, -0.425933837890625, -0.3897552490234375, -0.35357666015625, -0.3173980712890625, -0.281219482421875, -0.2450408935546875, -0.2088623046875, -0.1726837158203125, -0.136505126953125, -0.1003265380859375, -0.06414794921875, -0.0279693603515625, 0.008209228515625, 0.0443878173828125, 0.08056640625, 0.1167449951171875, 0.152923583984375, 0.1891021728515625, 0.22528076171875, 0.2614593505859375, 0.297637939453125, 0.3338165283203125, 0.3699951171875, 0.4061737060546875, 0.442352294921875, 0.4785308837890625, 0.51470947265625, 0.5508880615234375, 0.587066650390625, 0.6232452392578125, 0.659423828125, 0.6956024169921875, 0.731781005859375, 0.7679595947265625, 0.80413818359375, 0.8403167724609375, 0.876495361328125, 0.9126739501953125, 0.9488525390625, 0.9850311279296875, 1.021209716796875, 1.0573883056640625, 1.09356689453125, 1.1297454833984375, 1.165924072265625, 1.2021026611328125, 1.23828125]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 9.0, 11.0, 27.0, 32.0, 63.0, 105.0, 174.0, 236.0, 154.0, 99.0, 45.0, 20.0, 16.0, 7.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.71102237701416, -9.18679428100586, -8.662566184997559, -8.138338088989258, -7.614110946655273, -7.089882850646973, -6.565654754638672, -6.041426658630371, -5.5171990394592285, -4.992970943450928, -4.468743324279785, -3.9445152282714844, -3.4202873706817627, -2.896059513092041, -2.3718314170837402, -1.8476035594940186, -1.3233757019042969, -0.7991477847099304, -0.27491986751556396, 0.24930810928344727, 0.773535966873169, 1.2977638244628906, 1.8219919204711914, 2.346219778060913, 2.8704476356506348, 3.3946754932403564, 3.918903350830078, 4.443131446838379, 4.96735954284668, 5.491587162017822, 6.015815258026123, 6.540042877197266, 7.06427001953125, 7.588498115539551, 8.112726211547852, 8.636953353881836, 9.161181449890137, 9.685409545898438, 10.209637641906738, 10.733865737915039, 11.258092880249023, 11.782320976257324, 12.306549072265625, 12.83077621459961, 13.35500431060791, 13.879232406616211, 14.403460502624512, 14.927688598632812, 15.451916694641113, 15.976144790649414, 16.5003719329834, 17.024600982666016, 17.548828125, 18.073055267333984, 18.5972843170166, 19.121511459350586, 19.645740509033203, 20.169967651367188, 20.694196701049805, 21.21842384338379, 21.742652893066406, 22.26688003540039, 22.791107177734375, 23.315336227416992, 23.839563369750977]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 6.0, 4.0, 5.0, 11.0, 9.0, 16.0, 14.0, 16.0, 21.0, 25.0, 21.0, 20.0, 23.0, 33.0, 37.0, 35.0, 37.0, 55.0, 44.0, 64.0, 59.0, 54.0, 37.0, 39.0, 41.0, 50.0, 32.0, 27.0, 21.0, 27.0, 24.0, 20.0, 16.0, 13.0, 11.0, 5.0, 5.0, 11.0, 7.0, 8.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.055923461914062, -14.6394681930542, -14.223012924194336, -13.806557655334473, -13.39010238647461, -12.973648071289062, -12.5571928024292, -12.140737533569336, -11.724282264709473, -11.30782699584961, -10.891371726989746, -10.474916458129883, -10.058462142944336, -9.642005920410156, -9.22555160522461, -8.809096336364746, -8.392641067504883, -7.9761857986450195, -7.559730529785156, -7.143275737762451, -6.726820468902588, -6.310365200042725, -5.8939104080200195, -5.477455139160156, -5.060999870300293, -4.64454460144043, -4.228089332580566, -3.8116345405578613, -3.395179271697998, -2.9787240028381348, -2.5622689723968506, -2.1458139419555664, -1.7293577194213867, -1.312902569770813, -0.8964474201202393, -0.4799922704696655, -0.0635371208190918, 0.3529181480407715, 0.7693731784820557, 1.1858282089233398, 1.6022834777832031, 2.0187387466430664, 2.4351937770843506, 2.8516488075256348, 3.268104076385498, 3.6845593452453613, 4.101014137268066, 4.51746940612793, 4.933924674987793, 5.350379943847656, 5.7668352127075195, 6.183290004730225, 6.599745273590088, 7.016200542449951, 7.432655334472656, 7.8491106033325195, 8.265565872192383, 8.682021141052246, 9.09847640991211, 9.514931678771973, 9.931386947631836, 10.347841262817383, 10.764296531677246, 11.18075180053711, 11.597207069396973]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 2.0, 6.0, 5.0, 10.0, 17.0, 13.0, 20.0, 38.0, 85.0, 110.0, 237.0, 389.0, 835.0, 2250.0, 7001.0, 30109.0, 626242.0, 3467328.0, 44566.0, 9158.0, 2896.0, 1277.0, 594.0, 334.0, 232.0, 160.0, 98.0, 71.0, 51.0, 36.0, 30.0, 24.0, 18.0, 9.0, 8.0, 8.0, 7.0, 5.0, 4.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.751953125, -1.6761474609375, -1.600341796875, -1.5245361328125, -1.44873046875, -1.3729248046875, -1.297119140625, -1.2213134765625, -1.1455078125, -1.0697021484375, -0.993896484375, -0.9180908203125, -0.84228515625, -0.7664794921875, -0.690673828125, -0.6148681640625, -0.5390625, -0.4632568359375, -0.387451171875, -0.3116455078125, -0.23583984375, -0.1600341796875, -0.084228515625, -0.0084228515625, 0.0673828125, 0.1431884765625, 0.218994140625, 0.2947998046875, 0.37060546875, 0.4464111328125, 0.522216796875, 0.5980224609375, 0.673828125, 0.7496337890625, 0.825439453125, 0.9012451171875, 0.97705078125, 1.0528564453125, 1.128662109375, 1.2044677734375, 1.2802734375, 1.3560791015625, 1.431884765625, 1.5076904296875, 1.58349609375, 1.6593017578125, 1.735107421875, 1.8109130859375, 1.88671875, 1.9625244140625, 2.038330078125, 2.1141357421875, 2.18994140625, 2.2657470703125, 2.341552734375, 2.4173583984375, 2.4931640625, 2.5689697265625, 2.644775390625, 2.7205810546875, 2.79638671875, 2.8721923828125, 2.947998046875, 3.0238037109375, 3.099609375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 18.0, 21.0, 39.0, 28.0, 44.0, 64.0, 66.0, 83.0, 93.0, 78.0, 97.0, 79.0, 67.0, 52.0, 43.0, 30.0, 27.0, 24.0, 7.0, 9.0, 6.0, 8.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61669921875, -0.5879898071289062, -0.5592803955078125, -0.5305709838867188, -0.501861572265625, -0.47315216064453125, -0.4444427490234375, -0.41573333740234375, -0.38702392578125, -0.35831451416015625, -0.3296051025390625, -0.30089569091796875, -0.272186279296875, -0.24347686767578125, -0.2147674560546875, -0.18605804443359375, -0.1573486328125, -0.12863922119140625, -0.0999298095703125, -0.07122039794921875, -0.042510986328125, -0.01380157470703125, 0.0149078369140625, 0.04361724853515625, 0.07232666015625, 0.10103607177734375, 0.1297454833984375, 0.15845489501953125, 0.187164306640625, 0.21587371826171875, 0.2445831298828125, 0.27329254150390625, 0.302001953125, 0.33071136474609375, 0.3594207763671875, 0.38813018798828125, 0.416839599609375, 0.44554901123046875, 0.4742584228515625, 0.5029678344726562, 0.53167724609375, 0.5603866577148438, 0.5890960693359375, 0.6178054809570312, 0.646514892578125, 0.6752243041992188, 0.7039337158203125, 0.7326431274414062, 0.7613525390625, 0.7900619506835938, 0.8187713623046875, 0.8474807739257812, 0.876190185546875, 0.9048995971679688, 0.9336090087890625, 0.9623184204101562, 0.99102783203125, 1.0197372436523438, 1.0484466552734375, 1.0771560668945312, 1.105865478515625, 1.1345748901367188, 1.1632843017578125, 1.1919937133789062, 1.220703125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 2.0, 3.0, 9.0, 14.0, 30.0, 75.0, 166.0, 323.0, 797.0, 2822.0, 13732.0, 222350.0, 3889385.0, 55143.0, 6750.0, 1687.0, 587.0, 216.0, 113.0, 43.0, 14.0, 12.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2421875, -3.1617584228515625, -3.081329345703125, -3.0009002685546875, -2.92047119140625, -2.8400421142578125, -2.759613037109375, -2.6791839599609375, -2.5987548828125, -2.5183258056640625, -2.437896728515625, -2.3574676513671875, -2.27703857421875, -2.1966094970703125, -2.116180419921875, -2.0357513427734375, -1.955322265625, -1.8748931884765625, -1.794464111328125, -1.7140350341796875, -1.63360595703125, -1.5531768798828125, -1.472747802734375, -1.3923187255859375, -1.3118896484375, -1.2314605712890625, -1.151031494140625, -1.0706024169921875, -0.99017333984375, -0.9097442626953125, -0.829315185546875, -0.7488861083984375, -0.66845703125, -0.5880279541015625, -0.507598876953125, -0.4271697998046875, -0.34674072265625, -0.2663116455078125, -0.185882568359375, -0.1054534912109375, -0.0250244140625, 0.0554046630859375, 0.135833740234375, 0.2162628173828125, 0.29669189453125, 0.3771209716796875, 0.457550048828125, 0.5379791259765625, 0.618408203125, 0.6988372802734375, 0.779266357421875, 0.8596954345703125, 0.94012451171875, 1.0205535888671875, 1.100982666015625, 1.1814117431640625, 1.2618408203125, 1.3422698974609375, 1.422698974609375, 1.5031280517578125, 1.58355712890625, 1.6639862060546875, 1.744415283203125, 1.8248443603515625, 1.9052734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 9.0, 4.0, 6.0, 9.0, 13.0, 9.0, 21.0, 41.0, 33.0, 73.0, 135.0, 328.0, 1152.0, 1471.0, 391.0, 152.0, 82.0, 47.0, 29.0, 25.0, 14.0, 11.0, 1.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.72998046875, -0.7097625732421875, -0.689544677734375, -0.6693267822265625, -0.64910888671875, -0.6288909912109375, -0.608673095703125, -0.5884552001953125, -0.5682373046875, -0.5480194091796875, -0.527801513671875, -0.5075836181640625, -0.48736572265625, -0.4671478271484375, -0.446929931640625, -0.4267120361328125, -0.406494140625, -0.3862762451171875, -0.366058349609375, -0.3458404541015625, -0.32562255859375, -0.3054046630859375, -0.285186767578125, -0.2649688720703125, -0.2447509765625, -0.2245330810546875, -0.204315185546875, -0.1840972900390625, -0.16387939453125, -0.1436614990234375, -0.123443603515625, -0.1032257080078125, -0.0830078125, -0.0627899169921875, -0.042572021484375, -0.0223541259765625, -0.00213623046875, 0.0180816650390625, 0.038299560546875, 0.0585174560546875, 0.0787353515625, 0.0989532470703125, 0.119171142578125, 0.1393890380859375, 0.15960693359375, 0.1798248291015625, 0.200042724609375, 0.2202606201171875, 0.240478515625, 0.2606964111328125, 0.280914306640625, 0.3011322021484375, 0.32135009765625, 0.3415679931640625, 0.361785888671875, 0.3820037841796875, 0.4022216796875, 0.4224395751953125, 0.442657470703125, 0.4628753662109375, 0.48309326171875, 0.5033111572265625, 0.523529052734375, 0.5437469482421875, 0.56396484375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 10.0, 33.0, 113.0, 336.0, 334.0, 127.0, 38.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.283117294311523, -12.043548583984375, -11.803980827331543, -11.564412117004395, -11.324844360351562, -11.085275650024414, -10.845707893371582, -10.606139183044434, -10.366571426391602, -10.127002716064453, -9.887434959411621, -9.647866249084473, -9.40829849243164, -9.168729782104492, -8.92916202545166, -8.689593315124512, -8.450024604797363, -8.210455894470215, -7.970888137817383, -7.731319904327393, -7.491751670837402, -7.252182960510254, -7.012614727020264, -6.773046493530273, -6.533478260040283, -6.293910026550293, -6.054341793060303, -5.8147735595703125, -5.575204849243164, -5.335637092590332, -5.096068382263184, -4.856500148773193, -4.616932392120361, -4.377364158630371, -4.137795925140381, -3.8982274532318115, -3.6586592197418213, -3.419090986251831, -3.1795225143432617, -2.9399542808532715, -2.7003860473632812, -2.460817813873291, -2.221249580383301, -1.9816811084747314, -1.7421128749847412, -1.502544641494751, -1.2629762887954712, -1.0234079360961914, -0.7838397026062012, -0.5442714095115662, -0.30470311641693115, -0.06513482332229614, 0.17443346977233887, 0.4140017032623291, 0.6535700559616089, 0.8931384086608887, 1.132706642150879, 1.3722748756408691, 1.611843228340149, 1.8514115810394287, 2.090979814529419, 2.330548048019409, 2.5701165199279785, 2.8096847534179688, 3.049252986907959]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 6.0, 4.0, 8.0, 10.0, 19.0, 25.0, 16.0, 29.0, 39.0, 25.0, 39.0, 47.0, 37.0, 43.0, 48.0, 38.0, 50.0, 77.0, 53.0, 52.0, 42.0, 38.0, 37.0, 31.0, 32.0, 30.0, 21.0, 31.0, 14.0, 19.0, 7.0, 14.0, 3.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0656962394714355, -1.9971067905426025, -1.9285173416137695, -1.859928011894226, -1.791338562965393, -1.72274911403656, -1.6541597843170166, -1.5855703353881836, -1.5169808864593506, -1.4483914375305176, -1.3798019886016846, -1.3112126588821411, -1.242623209953308, -1.174033761024475, -1.1054444313049316, -1.0368549823760986, -0.9682655334472656, -0.8996760845184326, -0.8310866951942444, -0.7624973058700562, -0.6939078569412231, -0.6253184080123901, -0.5567290186882019, -0.4881395995616913, -0.41955018043518066, -0.35096076130867004, -0.2823713421821594, -0.2137819230556488, -0.14519250392913818, -0.07660308480262756, -0.008013665676116943, 0.06057575345039368, 0.1291654109954834, 0.19775483012199402, 0.26634424924850464, 0.33493366837501526, 0.4035230875015259, 0.4721125066280365, 0.5407019257545471, 0.6092913150787354, 0.6778807640075684, 0.7464702129364014, 0.8150596022605896, 0.8836489915847778, 0.9522384405136108, 1.0208278894424438, 1.0894172191619873, 1.1580066680908203, 1.2265961170196533, 1.2951855659484863, 1.3637750148773193, 1.4323643445968628, 1.5009537935256958, 1.5695432424545288, 1.6381325721740723, 1.7067220211029053, 1.7753114700317383, 1.8439009189605713, 1.9124903678894043, 1.9810796976089478, 2.0496692657470703, 2.118258476257324, 2.1868479251861572, 2.2554373741149902, 2.3240268230438232]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 5.0, 1.0, 10.0, 8.0, 16.0, 10.0, 15.0, 19.0, 28.0, 44.0, 56.0, 57.0, 87.0, 131.0, 183.0, 315.0, 537.0, 973.0, 1871.0, 4135.0, 9772.0, 26083.0, 83923.0, 295142.0, 417749.0, 140422.0, 41452.0, 14324.0, 5752.0, 2534.0, 1180.0, 678.0, 365.0, 205.0, 153.0, 96.0, 57.0, 45.0, 35.0, 16.0, 15.0, 21.0, 7.0, 10.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.8603515625, -1.7987518310546875, -1.737152099609375, -1.6755523681640625, -1.61395263671875, -1.5523529052734375, -1.490753173828125, -1.4291534423828125, -1.3675537109375, -1.3059539794921875, -1.244354248046875, -1.1827545166015625, -1.12115478515625, -1.0595550537109375, -0.997955322265625, -0.9363555908203125, -0.874755859375, -0.8131561279296875, -0.751556396484375, -0.6899566650390625, -0.62835693359375, -0.5667572021484375, -0.505157470703125, -0.4435577392578125, -0.3819580078125, -0.3203582763671875, -0.258758544921875, -0.1971588134765625, -0.13555908203125, -0.0739593505859375, -0.012359619140625, 0.0492401123046875, 0.11083984375, 0.1724395751953125, 0.234039306640625, 0.2956390380859375, 0.35723876953125, 0.4188385009765625, 0.480438232421875, 0.5420379638671875, 0.6036376953125, 0.6652374267578125, 0.726837158203125, 0.7884368896484375, 0.85003662109375, 0.9116363525390625, 0.973236083984375, 1.0348358154296875, 1.096435546875, 1.1580352783203125, 1.219635009765625, 1.2812347412109375, 1.34283447265625, 1.4044342041015625, 1.466033935546875, 1.5276336669921875, 1.5892333984375, 1.6508331298828125, 1.712432861328125, 1.7740325927734375, 1.83563232421875, 1.8972320556640625, 1.958831787109375, 2.0204315185546875, 2.08203125]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 12.0, 21.0, 22.0, 37.0, 48.0, 49.0, 78.0, 70.0, 100.0, 102.0, 82.0, 91.0, 76.0, 47.0, 47.0, 35.0, 30.0, 15.0, 14.0, 6.0, 6.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71875, -0.6883697509765625, -0.657989501953125, -0.6276092529296875, -0.59722900390625, -0.5668487548828125, -0.536468505859375, -0.5060882568359375, -0.4757080078125, -0.4453277587890625, -0.414947509765625, -0.3845672607421875, -0.35418701171875, -0.3238067626953125, -0.293426513671875, -0.2630462646484375, -0.232666015625, -0.2022857666015625, -0.171905517578125, -0.1415252685546875, -0.11114501953125, -0.0807647705078125, -0.050384521484375, -0.0200042724609375, 0.0103759765625, 0.0407562255859375, 0.071136474609375, 0.1015167236328125, 0.13189697265625, 0.1622772216796875, 0.192657470703125, 0.2230377197265625, 0.25341796875, 0.2837982177734375, 0.314178466796875, 0.3445587158203125, 0.37493896484375, 0.4053192138671875, 0.435699462890625, 0.4660797119140625, 0.4964599609375, 0.5268402099609375, 0.557220458984375, 0.5876007080078125, 0.61798095703125, 0.6483612060546875, 0.678741455078125, 0.7091217041015625, 0.739501953125, 0.7698822021484375, 0.800262451171875, 0.8306427001953125, 0.86102294921875, 0.8914031982421875, 0.921783447265625, 0.9521636962890625, 0.9825439453125, 1.0129241943359375, 1.043304443359375, 1.0736846923828125, 1.10406494140625, 1.1344451904296875, 1.164825439453125, 1.1952056884765625, 1.2255859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 6.0, 7.0, 11.0, 19.0, 16.0, 22.0, 41.0, 50.0, 77.0, 130.0, 214.0, 257.0, 387.0, 692.0, 1197.0, 2316.0, 4876.0, 10943.0, 28570.0, 82993.0, 249201.0, 387627.0, 182260.0, 58784.0, 21043.0, 8419.0, 3737.0, 1836.0, 1060.0, 607.0, 350.0, 247.0, 170.0, 111.0, 90.0, 65.0, 38.0, 25.0, 21.0, 10.0, 11.0, 5.0, 7.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.318359375, -1.2749176025390625, -1.231475830078125, -1.1880340576171875, -1.14459228515625, -1.1011505126953125, -1.057708740234375, -1.0142669677734375, -0.9708251953125, -0.9273834228515625, -0.883941650390625, -0.8404998779296875, -0.79705810546875, -0.7536163330078125, -0.710174560546875, -0.6667327880859375, -0.623291015625, -0.5798492431640625, -0.536407470703125, -0.4929656982421875, -0.44952392578125, -0.4060821533203125, -0.362640380859375, -0.3191986083984375, -0.2757568359375, -0.2323150634765625, -0.188873291015625, -0.1454315185546875, -0.10198974609375, -0.0585479736328125, -0.015106201171875, 0.0283355712890625, 0.07177734375, 0.1152191162109375, 0.158660888671875, 0.2021026611328125, 0.24554443359375, 0.2889862060546875, 0.332427978515625, 0.3758697509765625, 0.4193115234375, 0.4627532958984375, 0.506195068359375, 0.5496368408203125, 0.59307861328125, 0.6365203857421875, 0.679962158203125, 0.7234039306640625, 0.766845703125, 0.8102874755859375, 0.853729248046875, 0.8971710205078125, 0.94061279296875, 0.9840545654296875, 1.027496337890625, 1.0709381103515625, 1.1143798828125, 1.1578216552734375, 1.201263427734375, 1.2447052001953125, 1.28814697265625, 1.3315887451171875, 1.375030517578125, 1.4184722900390625, 1.4619140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 5.0, 3.0, 9.0, 7.0, 8.0, 13.0, 15.0, 15.0, 17.0, 22.0, 30.0, 39.0, 43.0, 35.0, 52.0, 56.0, 41.0, 45.0, 61.0, 59.0, 46.0, 61.0, 55.0, 42.0, 33.0, 34.0, 24.0, 26.0, 21.0, 20.0, 13.0, 19.0, 12.0, 9.0, 7.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.541015625, -2.460418701171875, -2.37982177734375, -2.299224853515625, -2.2186279296875, -2.138031005859375, -2.05743408203125, -1.976837158203125, -1.896240234375, -1.815643310546875, -1.73504638671875, -1.654449462890625, -1.5738525390625, -1.493255615234375, -1.41265869140625, -1.332061767578125, -1.25146484375, -1.170867919921875, -1.09027099609375, -1.009674072265625, -0.9290771484375, -0.848480224609375, -0.76788330078125, -0.687286376953125, -0.606689453125, -0.526092529296875, -0.44549560546875, -0.364898681640625, -0.2843017578125, -0.203704833984375, -0.12310791015625, -0.042510986328125, 0.0380859375, 0.118682861328125, 0.19927978515625, 0.279876708984375, 0.3604736328125, 0.441070556640625, 0.52166748046875, 0.602264404296875, 0.682861328125, 0.763458251953125, 0.84405517578125, 0.924652099609375, 1.0052490234375, 1.085845947265625, 1.16644287109375, 1.247039794921875, 1.32763671875, 1.408233642578125, 1.48883056640625, 1.569427490234375, 1.6500244140625, 1.730621337890625, 1.81121826171875, 1.891815185546875, 1.972412109375, 2.053009033203125, 2.13360595703125, 2.214202880859375, 2.2947998046875, 2.375396728515625, 2.45599365234375, 2.536590576171875, 2.6171875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 7.0, 15.0, 1.0, 17.0, 18.0, 29.0, 58.0, 112.0, 163.0, 343.0, 839.0, 2340.0, 8033.0, 34692.0, 200234.0, 596793.0, 164761.0, 29380.0, 7079.0, 2139.0, 798.0, 322.0, 162.0, 86.0, 52.0, 31.0, 18.0, 6.0, 8.0, 2.0, 7.0, 3.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.59765625, -0.5758819580078125, -0.554107666015625, -0.5323333740234375, -0.51055908203125, -0.4887847900390625, -0.467010498046875, -0.4452362060546875, -0.4234619140625, -0.4016876220703125, -0.379913330078125, -0.3581390380859375, -0.33636474609375, -0.3145904541015625, -0.292816162109375, -0.2710418701171875, -0.249267578125, -0.2274932861328125, -0.205718994140625, -0.1839447021484375, -0.16217041015625, -0.1403961181640625, -0.118621826171875, -0.0968475341796875, -0.0750732421875, -0.0532989501953125, -0.031524658203125, -0.0097503662109375, 0.01202392578125, 0.0337982177734375, 0.055572509765625, 0.0773468017578125, 0.09912109375, 0.1208953857421875, 0.142669677734375, 0.1644439697265625, 0.18621826171875, 0.2079925537109375, 0.229766845703125, 0.2515411376953125, 0.2733154296875, 0.2950897216796875, 0.316864013671875, 0.3386383056640625, 0.36041259765625, 0.3821868896484375, 0.403961181640625, 0.4257354736328125, 0.447509765625, 0.4692840576171875, 0.491058349609375, 0.5128326416015625, 0.53460693359375, 0.5563812255859375, 0.578155517578125, 0.5999298095703125, 0.6217041015625, 0.6434783935546875, 0.665252685546875, 0.6870269775390625, 0.70880126953125, 0.7305755615234375, 0.752349853515625, 0.7741241455078125, 0.7958984375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 5.0, 3.0, 8.0, 5.0, 7.0, 7.0, 8.0, 12.0, 13.0, 16.0, 28.0, 39.0, 43.0, 55.0, 77.0, 90.0, 137.0, 110.0, 76.0, 55.0, 36.0, 36.0, 25.0, 37.0, 18.0, 21.0, 10.0, 7.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.0001735687255859375, -0.0001690927892923355, -0.00016461685299873352, -0.00016014091670513153, -0.00015566498041152954, -0.00015118904411792755, -0.00014671310782432556, -0.00014223717153072357, -0.00013776123523712158, -0.0001332852989435196, -0.0001288093626499176, -0.0001243334263563156, -0.00011985749006271362, -0.00011538155376911163, -0.00011090561747550964, -0.00010642968118190765, -0.00010195374488830566, -9.747780859470367e-05, -9.300187230110168e-05, -8.85259360074997e-05, -8.40499997138977e-05, -7.957406342029572e-05, -7.509812712669373e-05, -7.062219083309174e-05, -6.614625453948975e-05, -6.167031824588776e-05, -5.7194381952285767e-05, -5.271844565868378e-05, -4.824250936508179e-05, -4.37665730714798e-05, -3.929063677787781e-05, -3.481470048427582e-05, -3.0338764190673828e-05, -2.586282789707184e-05, -2.138689160346985e-05, -1.691095530986786e-05, -1.2435019016265869e-05, -7.95908272266388e-06, -3.4831464290618896e-06, 9.927898645401e-07, 5.46872615814209e-06, 9.94466245174408e-06, 1.442059874534607e-05, 1.889653503894806e-05, 2.337247133255005e-05, 2.784840762615204e-05, 3.232434391975403e-05, 3.680028021335602e-05, 4.127621650695801e-05, 4.575215280056e-05, 5.022808909416199e-05, 5.470402538776398e-05, 5.917996168136597e-05, 6.365589797496796e-05, 6.813183426856995e-05, 7.260777056217194e-05, 7.708370685577393e-05, 8.155964314937592e-05, 8.60355794429779e-05, 9.05115157365799e-05, 9.498745203018188e-05, 9.946338832378387e-05, 0.00010393932461738586, 0.00010841526091098785, 0.00011289119720458984]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 2.0, 4.0, 7.0, 6.0, 7.0, 20.0, 12.0, 22.0, 38.0, 61.0, 67.0, 92.0, 159.0, 226.0, 444.0, 711.0, 1495.0, 3454.0, 9277.0, 29507.0, 108457.0, 451307.0, 331876.0, 77066.0, 21767.0, 6926.0, 2679.0, 1202.0, 626.0, 358.0, 215.0, 149.0, 110.0, 64.0, 49.0, 30.0, 24.0, 13.0, 14.0, 9.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62255859375, -0.6041793823242188, -0.5858001708984375, -0.5674209594726562, -0.549041748046875, -0.5306625366210938, -0.5122833251953125, -0.49390411376953125, -0.47552490234375, -0.45714569091796875, -0.4387664794921875, -0.42038726806640625, -0.402008056640625, -0.38362884521484375, -0.3652496337890625, -0.34687042236328125, -0.3284912109375, -0.31011199951171875, -0.2917327880859375, -0.27335357666015625, -0.254974365234375, -0.23659515380859375, -0.2182159423828125, -0.19983673095703125, -0.18145751953125, -0.16307830810546875, -0.1446990966796875, -0.12631988525390625, -0.107940673828125, -0.08956146240234375, -0.0711822509765625, -0.05280303955078125, -0.034423828125, -0.01604461669921875, 0.0023345947265625, 0.02071380615234375, 0.039093017578125, 0.05747222900390625, 0.0758514404296875, 0.09423065185546875, 0.11260986328125, 0.13098907470703125, 0.1493682861328125, 0.16774749755859375, 0.186126708984375, 0.20450592041015625, 0.2228851318359375, 0.24126434326171875, 0.2596435546875, 0.27802276611328125, 0.2964019775390625, 0.31478118896484375, 0.333160400390625, 0.35153961181640625, 0.3699188232421875, 0.38829803466796875, 0.40667724609375, 0.42505645751953125, 0.4434356689453125, 0.46181488037109375, 0.480194091796875, 0.49857330322265625, 0.5169525146484375, 0.5353317260742188, 0.5537109375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 8.0, 8.0, 8.0, 14.0, 11.0, 14.0, 20.0, 19.0, 46.0, 49.0, 52.0, 74.0, 75.0, 92.0, 91.0, 66.0, 81.0, 57.0, 53.0, 48.0, 27.0, 21.0, 13.0, 17.0, 12.0, 5.0, 3.0, 5.0, 5.0, 0.0, 6.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.666015625, -0.6464462280273438, -0.6268768310546875, -0.6073074340820312, -0.587738037109375, -0.5681686401367188, -0.5485992431640625, -0.5290298461914062, -0.50946044921875, -0.48989105224609375, -0.4703216552734375, -0.45075225830078125, -0.431182861328125, -0.41161346435546875, -0.3920440673828125, -0.37247467041015625, -0.3529052734375, -0.33333587646484375, -0.3137664794921875, -0.29419708251953125, -0.274627685546875, -0.25505828857421875, -0.2354888916015625, -0.21591949462890625, -0.19635009765625, -0.17678070068359375, -0.1572113037109375, -0.13764190673828125, -0.118072509765625, -0.09850311279296875, -0.0789337158203125, -0.05936431884765625, -0.039794921875, -0.02022552490234375, -0.0006561279296875, 0.01891326904296875, 0.038482666015625, 0.05805206298828125, 0.0776214599609375, 0.09719085693359375, 0.11676025390625, 0.13632965087890625, 0.1558990478515625, 0.17546844482421875, 0.195037841796875, 0.21460723876953125, 0.2341766357421875, 0.25374603271484375, 0.2733154296875, 0.29288482666015625, 0.3124542236328125, 0.33202362060546875, 0.351593017578125, 0.37116241455078125, 0.3907318115234375, 0.41030120849609375, 0.42987060546875, 0.44944000244140625, 0.4690093994140625, 0.48857879638671875, 0.508148193359375, 0.5277175903320312, 0.5472869873046875, 0.5668563842773438, 0.58642578125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 9.0, 5.0, 7.0, 11.0, 16.0, 17.0, 34.0, 37.0, 51.0, 66.0, 71.0, 105.0, 111.0, 100.0, 94.0, 68.0, 45.0, 38.0, 31.0, 20.0, 10.0, 18.0, 5.0, 3.0, 6.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.334507465362549, -7.079100608825684, -6.823693752288818, -6.568286895751953, -6.312880516052246, -6.057473659515381, -5.802066802978516, -5.54665994644165, -5.291253089904785, -5.03584623336792, -4.780439376831055, -4.525032997131348, -4.269626140594482, -4.014219284057617, -3.758812427520752, -3.5034055709838867, -3.2479991912841797, -2.9925923347473145, -2.7371857166290283, -2.481778860092163, -2.226372241973877, -1.9709653854370117, -1.7155585289001465, -1.4601517915725708, -1.2047450542449951, -0.9493383169174194, -0.693931519985199, -0.4385247230529785, -0.18311798572540283, 0.07228875160217285, 0.3276956081390381, 0.5831023454666138, 0.8385095596313477, 1.0939162969589233, 1.349323034286499, 1.6047298908233643, 1.86013662815094, 2.1155433654785156, 2.370950222015381, 2.626357078552246, 2.8817636966705322, 3.1371705532073975, 3.3925771713256836, 3.647984027862549, 3.903390884399414, 4.158797264099121, 4.4142045974731445, 4.669610977172852, 4.925017833709717, 5.180424690246582, 5.435831546783447, 5.6912384033203125, 5.9466447830200195, 6.202051639556885, 6.45745849609375, 6.712865352630615, 6.9682722091674805, 7.223679065704346, 7.479085922241211, 7.734492301940918, 7.989899158477783, 8.245306015014648, 8.500713348388672, 8.756119728088379, 9.011526107788086]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 8.0, 7.0, 7.0, 11.0, 9.0, 17.0, 19.0, 23.0, 17.0, 31.0, 28.0, 40.0, 36.0, 48.0, 39.0, 39.0, 56.0, 48.0, 48.0, 50.0, 43.0, 41.0, 41.0, 31.0, 23.0, 28.0, 31.0, 25.0, 23.0, 22.0, 16.0, 13.0, 15.0, 9.0, 6.0, 7.0, 5.0, 7.0, 7.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.732096672058105, -11.347393989562988, -10.962692260742188, -10.57798957824707, -10.19328784942627, -9.808585166931152, -9.423883438110352, -9.039180755615234, -8.654478073120117, -8.269775390625, -7.885073661804199, -7.500370979309082, -7.115669250488281, -6.730966567993164, -6.346264362335205, -5.961562156677246, -5.576860427856445, -5.192158222198486, -4.807456016540527, -4.42275333404541, -4.038051605224609, -3.6533491611480713, -3.268646717071533, -2.883944511413574, -2.4992423057556152, -2.1145401000976562, -1.7298377752304077, -1.3451354503631592, -0.9604332447052002, -0.5757310390472412, -0.19102859497070312, 0.19367361068725586, 0.5783748626708984, 0.9630771279335022, 1.347779393196106, 1.7324817180633545, 2.1171839237213135, 2.5018861293792725, 2.8865885734558105, 3.2712907791137695, 3.6559929847717285, 4.0406951904296875, 4.4253973960876465, 4.8100996017456055, 5.194802284240723, 5.579504013061523, 5.964206695556641, 6.3489089012146, 6.733611106872559, 7.118313312530518, 7.503015518188477, 7.887718200683594, 8.272419929504395, 8.657122611999512, 9.041824340820312, 9.42652702331543, 9.811229705810547, 10.195932388305664, 10.580634117126465, 10.965336799621582, 11.350038528442383, 11.7347412109375, 12.119443893432617, 12.504145622253418, 12.888847351074219]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 6.0, 11.0, 12.0, 29.0, 47.0, 62.0, 126.0, 259.0, 564.0, 1395.0, 4550.0, 21487.0, 426830.0, 3687038.0, 40093.0, 7422.0, 2263.0, 953.0, 447.0, 261.0, 155.0, 106.0, 52.0, 36.0, 30.0, 16.0, 12.0, 12.0, 2.0, 3.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.224609375, -2.1285400390625, -2.032470703125, -1.9364013671875, -1.84033203125, -1.7442626953125, -1.648193359375, -1.5521240234375, -1.4560546875, -1.3599853515625, -1.263916015625, -1.1678466796875, -1.07177734375, -0.9757080078125, -0.879638671875, -0.7835693359375, -0.6875, -0.5914306640625, -0.495361328125, -0.3992919921875, -0.30322265625, -0.2071533203125, -0.111083984375, -0.0150146484375, 0.0810546875, 0.1771240234375, 0.273193359375, 0.3692626953125, 0.46533203125, 0.5614013671875, 0.657470703125, 0.7535400390625, 0.849609375, 0.9456787109375, 1.041748046875, 1.1378173828125, 1.23388671875, 1.3299560546875, 1.426025390625, 1.5220947265625, 1.6181640625, 1.7142333984375, 1.810302734375, 1.9063720703125, 2.00244140625, 2.0985107421875, 2.194580078125, 2.2906494140625, 2.38671875, 2.4827880859375, 2.578857421875, 2.6749267578125, 2.77099609375, 2.8670654296875, 2.963134765625, 3.0592041015625, 3.1552734375, 3.2513427734375, 3.347412109375, 3.4434814453125, 3.53955078125, 3.6356201171875, 3.731689453125, 3.8277587890625, 3.923828125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 9.0, 1.0, 8.0, 17.0, 13.0, 20.0, 36.0, 60.0, 63.0, 66.0, 72.0, 70.0, 89.0, 81.0, 85.0, 82.0, 55.0, 39.0, 40.0, 35.0, 21.0, 16.0, 11.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.71484375, -0.683563232421875, -0.65228271484375, -0.621002197265625, -0.5897216796875, -0.558441162109375, -0.52716064453125, -0.495880126953125, -0.464599609375, -0.433319091796875, -0.40203857421875, -0.370758056640625, -0.3394775390625, -0.308197021484375, -0.27691650390625, -0.245635986328125, -0.21435546875, -0.183074951171875, -0.15179443359375, -0.120513916015625, -0.0892333984375, -0.057952880859375, -0.02667236328125, 0.004608154296875, 0.035888671875, 0.067169189453125, 0.09844970703125, 0.129730224609375, 0.1610107421875, 0.192291259765625, 0.22357177734375, 0.254852294921875, 0.2861328125, 0.317413330078125, 0.34869384765625, 0.379974365234375, 0.4112548828125, 0.442535400390625, 0.47381591796875, 0.505096435546875, 0.536376953125, 0.567657470703125, 0.59893798828125, 0.630218505859375, 0.6614990234375, 0.692779541015625, 0.72406005859375, 0.755340576171875, 0.78662109375, 0.817901611328125, 0.84918212890625, 0.880462646484375, 0.9117431640625, 0.943023681640625, 0.97430419921875, 1.005584716796875, 1.036865234375, 1.068145751953125, 1.09942626953125, 1.130706787109375, 1.1619873046875, 1.193267822265625, 1.22454833984375, 1.255828857421875, 1.287109375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 4.0, 8.0, 10.0, 19.0, 31.0, 87.0, 189.0, 417.0, 1004.0, 2785.0, 9178.0, 43841.0, 1100762.0, 2956679.0, 62911.0, 11255.0, 3180.0, 1108.0, 429.0, 190.0, 88.0, 58.0, 24.0, 8.0, 5.0, 10.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3935546875, -1.3357086181640625, -1.277862548828125, -1.2200164794921875, -1.16217041015625, -1.1043243408203125, -1.046478271484375, -0.9886322021484375, -0.9307861328125, -0.8729400634765625, -0.815093994140625, -0.7572479248046875, -0.69940185546875, -0.6415557861328125, -0.583709716796875, -0.5258636474609375, -0.468017578125, -0.4101715087890625, -0.352325439453125, -0.2944793701171875, -0.23663330078125, -0.1787872314453125, -0.120941162109375, -0.0630950927734375, -0.0052490234375, 0.0525970458984375, 0.110443115234375, 0.1682891845703125, 0.22613525390625, 0.2839813232421875, 0.341827392578125, 0.3996734619140625, 0.45751953125, 0.5153656005859375, 0.573211669921875, 0.6310577392578125, 0.68890380859375, 0.7467498779296875, 0.804595947265625, 0.8624420166015625, 0.9202880859375, 0.9781341552734375, 1.035980224609375, 1.0938262939453125, 1.15167236328125, 1.2095184326171875, 1.267364501953125, 1.3252105712890625, 1.383056640625, 1.4409027099609375, 1.498748779296875, 1.5565948486328125, 1.61444091796875, 1.6722869873046875, 1.730133056640625, 1.7879791259765625, 1.8458251953125, 1.9036712646484375, 1.961517333984375, 2.0193634033203125, 2.07720947265625, 2.1350555419921875, 2.192901611328125, 2.2507476806640625, 2.30859375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 7.0, 7.0, 4.0, 4.0, 7.0, 13.0, 9.0, 25.0, 29.0, 30.0, 75.0, 105.0, 281.0, 817.0, 1618.0, 566.0, 200.0, 109.0, 54.0, 32.0, 23.0, 19.0, 14.0, 11.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7158203125, -0.6905136108398438, -0.6652069091796875, -0.6399002075195312, -0.614593505859375, -0.5892868041992188, -0.5639801025390625, -0.5386734008789062, -0.51336669921875, -0.48805999755859375, -0.4627532958984375, -0.43744659423828125, -0.412139892578125, -0.38683319091796875, -0.3615264892578125, -0.33621978759765625, -0.3109130859375, -0.28560638427734375, -0.2602996826171875, -0.23499298095703125, -0.209686279296875, -0.18437957763671875, -0.1590728759765625, -0.13376617431640625, -0.10845947265625, -0.08315277099609375, -0.0578460693359375, -0.03253936767578125, -0.007232666015625, 0.01807403564453125, 0.0433807373046875, 0.06868743896484375, 0.093994140625, 0.11930084228515625, 0.1446075439453125, 0.16991424560546875, 0.195220947265625, 0.22052764892578125, 0.2458343505859375, 0.27114105224609375, 0.29644775390625, 0.32175445556640625, 0.3470611572265625, 0.37236785888671875, 0.397674560546875, 0.42298126220703125, 0.4482879638671875, 0.47359466552734375, 0.4989013671875, 0.5242080688476562, 0.5495147705078125, 0.5748214721679688, 0.600128173828125, 0.6254348754882812, 0.6507415771484375, 0.6760482788085938, 0.70135498046875, 0.7266616821289062, 0.7519683837890625, 0.7772750854492188, 0.802581787109375, 0.8278884887695312, 0.8531951904296875, 0.8785018920898438, 0.90380859375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 11.0, 9.0, 15.0, 32.0, 60.0, 121.0, 163.0, 203.0, 170.0, 99.0, 62.0, 32.0, 15.0, 6.0, 6.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.301664352416992, -3.164907932281494, -3.028151512145996, -2.891395092010498, -2.754638671875, -2.617882251739502, -2.481126070022583, -2.344369649887085, -2.207613229751587, -2.070856809616089, -1.9341003894805908, -1.7973440885543823, -1.6605876684188843, -1.5238312482833862, -1.3870749473571777, -1.2503185272216797, -1.1135621070861816, -0.9768056869506836, -0.8400493264198303, -0.703292965888977, -0.566536545753479, -0.42978012561798096, -0.2930237650871277, -0.15626740455627441, -0.019510984420776367, 0.11724540591239929, 0.25400179624557495, 0.3907581865787506, 0.5275145769119263, 0.6642709970474243, 0.8010273575782776, 0.9377837181091309, 1.074540138244629, 1.211296558380127, 1.348052978515625, 1.4848092794418335, 1.6215656995773315, 1.7583221197128296, 1.895078420639038, 2.031834840774536, 2.168591260910034, 2.3053476810455322, 2.4421041011810303, 2.5788605213165283, 2.7156167030334473, 2.8523731231689453, 2.9891295433044434, 3.1258859634399414, 3.2626423835754395, 3.3993988037109375, 3.5361552238464355, 3.6729116439819336, 3.8096680641174316, 3.9464244842529297, 4.083180904388428, 4.219937324523926, 4.356693267822266, 4.493449687957764, 4.630206108093262, 4.76696252822876, 4.903718948364258, 5.040475368499756, 5.177231788635254, 5.313987731933594, 5.45074462890625]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 4.0, 3.0, 12.0, 16.0, 12.0, 10.0, 17.0, 23.0, 26.0, 21.0, 29.0, 34.0, 29.0, 44.0, 45.0, 45.0, 38.0, 51.0, 46.0, 55.0, 48.0, 48.0, 40.0, 35.0, 38.0, 17.0, 33.0, 35.0, 19.0, 15.0, 16.0, 19.0, 17.0, 16.0, 12.0, 8.0, 7.0, 1.0, 4.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.7056069374084473, -2.6333892345428467, -2.561171531677246, -2.4889540672302246, -2.416736364364624, -2.3445186614990234, -2.272300958633423, -2.2000832557678223, -2.1278655529022217, -2.055647850036621, -1.98343026638031, -1.9112125635147095, -1.8389948606491089, -1.7667772769927979, -1.6945595741271973, -1.6223418712615967, -1.5501242876052856, -1.477906584739685, -1.405689001083374, -1.3334712982177734, -1.2612535953521729, -1.1890358924865723, -1.1168183088302612, -1.0446006059646606, -0.9723829627037048, -0.900165319442749, -0.8279476165771484, -0.7557299733161926, -0.6835123300552368, -0.6112946271896362, -0.5390769839286804, -0.46685928106307983, -0.3946417570114136, -0.3224240839481354, -0.2502064108848572, -0.17798876762390137, -0.10577109456062317, -0.03355342149734497, 0.03866422176361084, 0.11088192462921143, 0.18309956789016724, 0.25531724095344543, 0.32753491401672363, 0.39975255727767944, 0.47197023034095764, 0.5441879034042358, 0.6164055466651917, 0.6886232495307922, 0.760840892791748, 0.8330585360527039, 0.9052762389183044, 0.9774938821792603, 1.0497115850448608, 1.1219291687011719, 1.1941468715667725, 1.266364574432373, 1.3385822772979736, 1.4107999801635742, 1.4830175638198853, 1.5552352666854858, 1.6274529695510864, 1.6996705532073975, 1.771888256072998, 1.8441059589385986, 1.9163235425949097]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 7.0, 8.0, 9.0, 19.0, 26.0, 64.0, 79.0, 136.0, 252.0, 484.0, 1151.0, 3089.0, 10573.0, 55088.0, 465480.0, 443766.0, 52695.0, 10413.0, 3037.0, 1138.0, 436.0, 267.0, 127.0, 72.0, 50.0, 23.0, 21.0, 13.0, 5.0, 5.0, 7.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.875, -2.77227783203125, -2.6695556640625, -2.56683349609375, -2.464111328125, -2.36138916015625, -2.2586669921875, -2.15594482421875, -2.05322265625, -1.95050048828125, -1.8477783203125, -1.74505615234375, -1.642333984375, -1.53961181640625, -1.4368896484375, -1.33416748046875, -1.2314453125, -1.12872314453125, -1.0260009765625, -0.92327880859375, -0.820556640625, -0.71783447265625, -0.6151123046875, -0.51239013671875, -0.40966796875, -0.30694580078125, -0.2042236328125, -0.10150146484375, 0.001220703125, 0.10394287109375, 0.2066650390625, 0.30938720703125, 0.412109375, 0.51483154296875, 0.6175537109375, 0.72027587890625, 0.822998046875, 0.92572021484375, 1.0284423828125, 1.13116455078125, 1.23388671875, 1.33660888671875, 1.4393310546875, 1.54205322265625, 1.644775390625, 1.74749755859375, 1.8502197265625, 1.95294189453125, 2.0556640625, 2.15838623046875, 2.2611083984375, 2.36383056640625, 2.466552734375, 2.56927490234375, 2.6719970703125, 2.77471923828125, 2.87744140625, 2.98016357421875, 3.0828857421875, 3.18560791015625, 3.288330078125, 3.39105224609375, 3.4937744140625, 3.59649658203125, 3.69921875]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 6.0, 14.0, 12.0, 30.0, 41.0, 60.0, 75.0, 74.0, 86.0, 85.0, 76.0, 86.0, 95.0, 63.0, 48.0, 40.0, 36.0, 23.0, 15.0, 14.0, 7.0, 6.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75927734375, -0.7266769409179688, -0.6940765380859375, -0.6614761352539062, -0.628875732421875, -0.5962753295898438, -0.5636749267578125, -0.5310745239257812, -0.49847412109375, -0.46587371826171875, -0.4332733154296875, -0.40067291259765625, -0.368072509765625, -0.33547210693359375, -0.3028717041015625, -0.27027130126953125, -0.2376708984375, -0.20507049560546875, -0.1724700927734375, -0.13986968994140625, -0.107269287109375, -0.07466888427734375, -0.0420684814453125, -0.00946807861328125, 0.02313232421875, 0.05573272705078125, 0.0883331298828125, 0.12093353271484375, 0.153533935546875, 0.18613433837890625, 0.2187347412109375, 0.25133514404296875, 0.283935546875, 0.31653594970703125, 0.3491363525390625, 0.38173675537109375, 0.414337158203125, 0.44693756103515625, 0.4795379638671875, 0.5121383666992188, 0.54473876953125, 0.5773391723632812, 0.6099395751953125, 0.6425399780273438, 0.675140380859375, 0.7077407836914062, 0.7403411865234375, 0.7729415893554688, 0.8055419921875, 0.8381423950195312, 0.8707427978515625, 0.9033432006835938, 0.935943603515625, 0.9685440063476562, 1.0011444091796875, 1.0337448120117188, 1.06634521484375, 1.0989456176757812, 1.1315460205078125, 1.1641464233398438, 1.196746826171875, 1.2293472290039062, 1.2619476318359375, 1.2945480346679688, 1.3271484375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 6.0, 7.0, 9.0, 14.0, 21.0, 37.0, 36.0, 56.0, 88.0, 130.0, 199.0, 337.0, 601.0, 1240.0, 2992.0, 8118.0, 25620.0, 96404.0, 369101.0, 394778.0, 105656.0, 28277.0, 8718.0, 3106.0, 1286.0, 655.0, 384.0, 208.0, 149.0, 96.0, 66.0, 52.0, 36.0, 22.0, 17.0, 18.0, 2.0, 7.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6337890625, -1.5793914794921875, -1.524993896484375, -1.4705963134765625, -1.41619873046875, -1.3618011474609375, -1.307403564453125, -1.2530059814453125, -1.1986083984375, -1.1442108154296875, -1.089813232421875, -1.0354156494140625, -0.98101806640625, -0.9266204833984375, -0.872222900390625, -0.8178253173828125, -0.763427734375, -0.7090301513671875, -0.654632568359375, -0.6002349853515625, -0.54583740234375, -0.4914398193359375, -0.437042236328125, -0.3826446533203125, -0.3282470703125, -0.2738494873046875, -0.219451904296875, -0.1650543212890625, -0.11065673828125, -0.0562591552734375, -0.001861572265625, 0.0525360107421875, 0.10693359375, 0.1613311767578125, 0.215728759765625, 0.2701263427734375, 0.32452392578125, 0.3789215087890625, 0.433319091796875, 0.4877166748046875, 0.5421142578125, 0.5965118408203125, 0.650909423828125, 0.7053070068359375, 0.75970458984375, 0.8141021728515625, 0.868499755859375, 0.9228973388671875, 0.977294921875, 1.0316925048828125, 1.086090087890625, 1.1404876708984375, 1.19488525390625, 1.2492828369140625, 1.303680419921875, 1.3580780029296875, 1.4124755859375, 1.4668731689453125, 1.521270751953125, 1.5756683349609375, 1.63006591796875, 1.6844635009765625, 1.738861083984375, 1.7932586669921875, 1.84765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0, 2.0, 4.0, 9.0, 5.0, 8.0, 9.0, 14.0, 10.0, 13.0, 22.0, 20.0, 16.0, 26.0, 27.0, 37.0, 39.0, 31.0, 41.0, 39.0, 50.0, 39.0, 43.0, 43.0, 37.0, 33.0, 44.0, 33.0, 34.0, 23.0, 22.0, 35.0, 28.0, 22.0, 16.0, 24.0, 17.0, 22.0, 13.0, 6.0, 10.0, 10.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 5.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.9580078125, -1.8949737548828125, -1.831939697265625, -1.7689056396484375, -1.70587158203125, -1.6428375244140625, -1.579803466796875, -1.5167694091796875, -1.4537353515625, -1.3907012939453125, -1.327667236328125, -1.2646331787109375, -1.20159912109375, -1.1385650634765625, -1.075531005859375, -1.0124969482421875, -0.949462890625, -0.8864288330078125, -0.823394775390625, -0.7603607177734375, -0.69732666015625, -0.6342926025390625, -0.571258544921875, -0.5082244873046875, -0.4451904296875, -0.3821563720703125, -0.319122314453125, -0.2560882568359375, -0.19305419921875, -0.1300201416015625, -0.066986083984375, -0.0039520263671875, 0.05908203125, 0.1221160888671875, 0.185150146484375, 0.2481842041015625, 0.31121826171875, 0.3742523193359375, 0.437286376953125, 0.5003204345703125, 0.5633544921875, 0.6263885498046875, 0.689422607421875, 0.7524566650390625, 0.81549072265625, 0.8785247802734375, 0.941558837890625, 1.0045928955078125, 1.067626953125, 1.1306610107421875, 1.193695068359375, 1.2567291259765625, 1.31976318359375, 1.3827972412109375, 1.445831298828125, 1.5088653564453125, 1.5718994140625, 1.6349334716796875, 1.697967529296875, 1.7610015869140625, 1.82403564453125, 1.8870697021484375, 1.950103759765625, 2.0131378173828125, 2.076171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 6.0, 4.0, 8.0, 14.0, 25.0, 29.0, 77.0, 148.0, 278.0, 693.0, 2203.0, 10277.0, 75883.0, 770965.0, 164917.0, 18016.0, 3356.0, 923.0, 368.0, 133.0, 102.0, 44.0, 29.0, 13.0, 17.0, 9.0, 7.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72900390625, -0.7016525268554688, -0.6743011474609375, -0.6469497680664062, -0.619598388671875, -0.5922470092773438, -0.5648956298828125, -0.5375442504882812, -0.51019287109375, -0.48284149169921875, -0.4554901123046875, -0.42813873291015625, -0.400787353515625, -0.37343597412109375, -0.3460845947265625, -0.31873321533203125, -0.2913818359375, -0.26403045654296875, -0.2366790771484375, -0.20932769775390625, -0.181976318359375, -0.15462493896484375, -0.1272735595703125, -0.09992218017578125, -0.07257080078125, -0.04521942138671875, -0.0178680419921875, 0.00948333740234375, 0.036834716796875, 0.06418609619140625, 0.0915374755859375, 0.11888885498046875, 0.146240234375, 0.17359161376953125, 0.2009429931640625, 0.22829437255859375, 0.255645751953125, 0.28299713134765625, 0.3103485107421875, 0.33769989013671875, 0.36505126953125, 0.39240264892578125, 0.4197540283203125, 0.44710540771484375, 0.474456787109375, 0.5018081665039062, 0.5291595458984375, 0.5565109252929688, 0.5838623046875, 0.6112136840820312, 0.6385650634765625, 0.6659164428710938, 0.693267822265625, 0.7206192016601562, 0.7479705810546875, 0.7753219604492188, 0.80267333984375, 0.8300247192382812, 0.8573760986328125, 0.8847274780273438, 0.912078857421875, 0.9394302368164062, 0.9667816162109375, 0.9941329956054688, 1.021484375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 3.0, 6.0, 5.0, 5.0, 8.0, 8.0, 10.0, 15.0, 14.0, 13.0, 15.0, 32.0, 51.0, 76.0, 98.0, 133.0, 126.0, 102.0, 69.0, 42.0, 29.0, 22.0, 18.0, 13.0, 21.0, 15.0, 5.0, 8.0, 5.0, 9.0, 7.0, 8.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00012803077697753906, -0.00012412946671247482, -0.00012022815644741058, -0.00011632684618234634, -0.0001124255359172821, -0.00010852422565221786, -0.00010462291538715363, -0.00010072160512208939, -9.682029485702515e-05, -9.291898459196091e-05, -8.901767432689667e-05, -8.511636406183243e-05, -8.121505379676819e-05, -7.731374353170395e-05, -7.341243326663971e-05, -6.951112300157547e-05, -6.560981273651123e-05, -6.170850247144699e-05, -5.780719220638275e-05, -5.390588194131851e-05, -5.000457167625427e-05, -4.610326141119003e-05, -4.2201951146125793e-05, -3.8300640881061554e-05, -3.4399330615997314e-05, -3.0498020350933075e-05, -2.6596710085868835e-05, -2.2695399820804596e-05, -1.8794089555740356e-05, -1.4892779290676117e-05, -1.0991469025611877e-05, -7.090158760547638e-06, -3.1888484954833984e-06, 7.124617695808411e-07, 4.6137720346450806e-06, 8.51508229970932e-06, 1.241639256477356e-05, 1.63177028298378e-05, 2.021901309490204e-05, 2.4120323359966278e-05, 2.8021633625030518e-05, 3.192294389009476e-05, 3.5824254155158997e-05, 3.9725564420223236e-05, 4.3626874685287476e-05, 4.7528184950351715e-05, 5.1429495215415955e-05, 5.5330805480480194e-05, 5.9232115745544434e-05, 6.313342601060867e-05, 6.703473627567291e-05, 7.093604654073715e-05, 7.483735680580139e-05, 7.873866707086563e-05, 8.263997733592987e-05, 8.654128760099411e-05, 9.044259786605835e-05, 9.434390813112259e-05, 9.824521839618683e-05, 0.00010214652866125107, 0.00010604783892631531, 0.00010994914919137955, 0.00011385045945644379, 0.00011775176972150803, 0.00012165307998657227]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 7.0, 6.0, 10.0, 8.0, 11.0, 22.0, 37.0, 44.0, 54.0, 86.0, 138.0, 189.0, 331.0, 559.0, 1010.0, 2100.0, 4587.0, 12620.0, 38221.0, 144439.0, 613078.0, 165587.0, 41981.0, 13693.0, 5054.0, 2088.0, 1003.0, 569.0, 351.0, 203.0, 139.0, 100.0, 76.0, 38.0, 36.0, 31.0, 16.0, 9.0, 9.0, 4.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.491943359375, -0.4758338928222656, -0.45972442626953125, -0.4436149597167969, -0.4275054931640625, -0.4113960266113281, -0.39528656005859375, -0.3791770935058594, -0.363067626953125, -0.3469581604003906, -0.33084869384765625, -0.3147392272949219, -0.2986297607421875, -0.2825202941894531, -0.26641082763671875, -0.2503013610839844, -0.23419189453125, -0.21808242797851562, -0.20197296142578125, -0.18586349487304688, -0.1697540283203125, -0.15364456176757812, -0.13753509521484375, -0.12142562866210938, -0.105316162109375, -0.08920669555664062, -0.07309722900390625, -0.056987762451171875, -0.0408782958984375, -0.024768829345703125, -0.00865936279296875, 0.007450103759765625, 0.0235595703125, 0.039669036865234375, 0.05577850341796875, 0.07188796997070312, 0.0879974365234375, 0.10410690307617188, 0.12021636962890625, 0.13632583618164062, 0.152435302734375, 0.16854476928710938, 0.18465423583984375, 0.20076370239257812, 0.2168731689453125, 0.23298263549804688, 0.24909210205078125, 0.2652015686035156, 0.28131103515625, 0.2974205017089844, 0.31352996826171875, 0.3296394348144531, 0.3457489013671875, 0.3618583679199219, 0.37796783447265625, 0.3940773010253906, 0.410186767578125, 0.4262962341308594, 0.44240570068359375, 0.4585151672363281, 0.4746246337890625, 0.4907341003417969, 0.5068435668945312, 0.5229530334472656, 0.5390625]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 5.0, 8.0, 6.0, 9.0, 15.0, 15.0, 18.0, 28.0, 27.0, 50.0, 53.0, 84.0, 74.0, 100.0, 77.0, 81.0, 57.0, 65.0, 46.0, 41.0, 23.0, 25.0, 21.0, 11.0, 10.0, 5.0, 8.0, 7.0, 5.0, 2.0, 3.0, 0.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39111328125, -0.3760528564453125, -0.360992431640625, -0.3459320068359375, -0.33087158203125, -0.3158111572265625, -0.300750732421875, -0.2856903076171875, -0.2706298828125, -0.2555694580078125, -0.240509033203125, -0.2254486083984375, -0.21038818359375, -0.1953277587890625, -0.180267333984375, -0.1652069091796875, -0.150146484375, -0.1350860595703125, -0.120025634765625, -0.1049652099609375, -0.08990478515625, -0.0748443603515625, -0.059783935546875, -0.0447235107421875, -0.0296630859375, -0.0146026611328125, 0.000457763671875, 0.0155181884765625, 0.03057861328125, 0.0456390380859375, 0.060699462890625, 0.0757598876953125, 0.0908203125, 0.1058807373046875, 0.120941162109375, 0.1360015869140625, 0.15106201171875, 0.1661224365234375, 0.181182861328125, 0.1962432861328125, 0.2113037109375, 0.2263641357421875, 0.241424560546875, 0.2564849853515625, 0.27154541015625, 0.2866058349609375, 0.301666259765625, 0.3167266845703125, 0.331787109375, 0.3468475341796875, 0.361907958984375, 0.3769683837890625, 0.39202880859375, 0.4070892333984375, 0.422149658203125, 0.4372100830078125, 0.4522705078125, 0.4673309326171875, 0.482391357421875, 0.4974517822265625, 0.51251220703125, 0.5275726318359375, 0.542633056640625, 0.5576934814453125, 0.57275390625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 4.0, 11.0, 47.0, 145.0, 277.0, 298.0, 154.0, 40.0, 19.0, 7.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.471875190734863, -12.680070877075195, -11.888266563415527, -11.09646224975586, -10.304656982421875, -9.512852668762207, -8.721048355102539, -7.929243564605713, -7.137439250946045, -6.345634937286377, -5.553830146789551, -4.762025833129883, -3.9702212810516357, -3.1784167289733887, -2.3866124153137207, -1.5948076248168945, -0.8030033111572266, -0.011198818683624268, 0.780605673789978, 1.5724101066589355, 2.3642146587371826, 3.1560192108154297, 3.9478235244750977, 4.739628314971924, 5.531432628631592, 6.32323694229126, 7.115041732788086, 7.906846046447754, 8.698650360107422, 9.490455627441406, 10.282258987426758, 11.074064254760742, 11.865869522094727, 12.657673835754395, 13.449478149414062, 14.241283416748047, 15.033087730407715, 15.824892044067383, 16.616695404052734, 17.40850067138672, 18.200305938720703, 18.992111206054688, 19.78391456604004, 20.575719833374023, 21.367523193359375, 22.15932846069336, 22.951133728027344, 23.742937088012695, 24.534740447998047, 25.32654571533203, 26.118349075317383, 26.910154342651367, 27.70195770263672, 28.493762969970703, 29.285568237304688, 30.07737159729004, 30.869176864624023, 31.660982131958008, 32.45278549194336, 33.244590759277344, 34.03639602661133, 34.82820129394531, 35.62000274658203, 36.411808013916016, 37.20361328125]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 6.0, 1.0, 6.0, 9.0, 3.0, 12.0, 22.0, 12.0, 15.0, 24.0, 28.0, 20.0, 32.0, 30.0, 36.0, 45.0, 36.0, 52.0, 34.0, 54.0, 37.0, 47.0, 42.0, 32.0, 43.0, 54.0, 37.0, 34.0, 29.0, 33.0, 27.0, 22.0, 20.0, 5.0, 11.0, 17.0, 12.0, 4.0, 10.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-11.764881134033203, -11.405776977539062, -11.046672821044922, -10.687568664550781, -10.32846450805664, -9.9693603515625, -9.61025619506836, -9.251152038574219, -8.892047882080078, -8.532943725585938, -8.173839569091797, -7.814735412597656, -7.455631256103516, -7.096527099609375, -6.737423419952393, -6.378319263458252, -6.0192155838012695, -5.660111427307129, -5.301007270812988, -4.941903114318848, -4.582798957824707, -4.223694801330566, -3.864591121673584, -3.5054869651794434, -3.1463828086853027, -2.787278652191162, -2.4281744956970215, -2.06907057762146, -1.7099664211273193, -1.3508622646331787, -0.9917583465576172, -0.6326541900634766, -0.27355003356933594, 0.08555406332015991, 0.44465816020965576, 0.8037621974945068, 1.1628663539886475, 1.521970510482788, 1.8810744285583496, 2.2401785850524902, 2.599282741546631, 2.9583868980407715, 3.317491054534912, 3.6765949726104736, 4.035698890686035, 4.394803047180176, 4.753907203674316, 5.113011360168457, 5.472115516662598, 5.831219673156738, 6.190323829650879, 6.5494279861450195, 6.90853214263916, 7.267636299133301, 7.626739978790283, 7.985844135284424, 8.344947814941406, 8.704051971435547, 9.063156127929688, 9.422260284423828, 9.781364440917969, 10.14046859741211, 10.49957275390625, 10.85867691040039, 11.217781066894531]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 5.0, 7.0, 9.0, 8.0, 13.0, 25.0, 36.0, 46.0, 74.0, 121.0, 230.0, 401.0, 744.0, 1533.0, 3426.0, 8727.0, 30145.0, 250750.0, 3770472.0, 96951.0, 18346.0, 6154.0, 2663.0, 1278.0, 716.0, 440.0, 279.0, 183.0, 123.0, 104.0, 58.0, 48.0, 34.0, 26.0, 23.0, 19.0, 21.0, 11.0, 8.0, 10.0, 5.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.5947265625, -1.5317840576171875, -1.468841552734375, -1.4058990478515625, -1.34295654296875, -1.2800140380859375, -1.217071533203125, -1.1541290283203125, -1.0911865234375, -1.0282440185546875, -0.965301513671875, -0.9023590087890625, -0.83941650390625, -0.7764739990234375, -0.713531494140625, -0.6505889892578125, -0.587646484375, -0.5247039794921875, -0.461761474609375, -0.3988189697265625, -0.33587646484375, -0.2729339599609375, -0.209991455078125, -0.1470489501953125, -0.0841064453125, -0.0211639404296875, 0.041778564453125, 0.1047210693359375, 0.16766357421875, 0.2306060791015625, 0.293548583984375, 0.3564910888671875, 0.41943359375, 0.4823760986328125, 0.545318603515625, 0.6082611083984375, 0.67120361328125, 0.7341461181640625, 0.797088623046875, 0.8600311279296875, 0.9229736328125, 0.9859161376953125, 1.048858642578125, 1.1118011474609375, 1.17474365234375, 1.2376861572265625, 1.300628662109375, 1.3635711669921875, 1.426513671875, 1.4894561767578125, 1.552398681640625, 1.6153411865234375, 1.67828369140625, 1.7412261962890625, 1.804168701171875, 1.8671112060546875, 1.9300537109375, 1.9929962158203125, 2.055938720703125, 2.1188812255859375, 2.18182373046875, 2.2447662353515625, 2.307708740234375, 2.3706512451171875, 2.43359375]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 4.0, 11.0, 12.0, 16.0, 23.0, 40.0, 51.0, 54.0, 73.0, 68.0, 76.0, 83.0, 76.0, 93.0, 55.0, 61.0, 56.0, 48.0, 28.0, 26.0, 14.0, 9.0, 11.0, 7.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73291015625, -0.7010269165039062, -0.6691436767578125, -0.6372604370117188, -0.605377197265625, -0.5734939575195312, -0.5416107177734375, -0.5097274780273438, -0.47784423828125, -0.44596099853515625, -0.4140777587890625, -0.38219451904296875, -0.350311279296875, -0.31842803955078125, -0.2865447998046875, -0.25466156005859375, -0.2227783203125, -0.19089508056640625, -0.1590118408203125, -0.12712860107421875, -0.095245361328125, -0.06336212158203125, -0.0314788818359375, 0.00040435791015625, 0.03228759765625, 0.06417083740234375, 0.0960540771484375, 0.12793731689453125, 0.159820556640625, 0.19170379638671875, 0.2235870361328125, 0.25547027587890625, 0.287353515625, 0.31923675537109375, 0.3511199951171875, 0.38300323486328125, 0.414886474609375, 0.44676971435546875, 0.4786529541015625, 0.5105361938476562, 0.54241943359375, 0.5743026733398438, 0.6061859130859375, 0.6380691528320312, 0.669952392578125, 0.7018356323242188, 0.7337188720703125, 0.7656021118164062, 0.7974853515625, 0.8293685913085938, 0.8612518310546875, 0.8931350708007812, 0.925018310546875, 0.9569015502929688, 0.9887847900390625, 1.0206680297851562, 1.05255126953125, 1.0844345092773438, 1.1163177490234375, 1.1482009887695312, 1.180084228515625, 1.2119674682617188, 1.2438507080078125, 1.2757339477539062, 1.3076171875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 6.0, 2.0, 4.0, 6.0, 4.0, 9.0, 10.0, 17.0, 25.0, 28.0, 43.0, 69.0, 89.0, 177.0, 307.0, 545.0, 1067.0, 2244.0, 4814.0, 12116.0, 41966.0, 376897.0, 3533206.0, 174975.0, 28833.0, 9423.0, 3768.0, 1681.0, 806.0, 428.0, 262.0, 156.0, 98.0, 63.0, 50.0, 29.0, 21.0, 14.0, 7.0, 7.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2314453125, -1.1921844482421875, -1.152923583984375, -1.1136627197265625, -1.07440185546875, -1.0351409912109375, -0.995880126953125, -0.9566192626953125, -0.9173583984375, -0.8780975341796875, -0.838836669921875, -0.7995758056640625, -0.76031494140625, -0.7210540771484375, -0.681793212890625, -0.6425323486328125, -0.603271484375, -0.5640106201171875, -0.524749755859375, -0.4854888916015625, -0.44622802734375, -0.4069671630859375, -0.367706298828125, -0.3284454345703125, -0.2891845703125, -0.2499237060546875, -0.210662841796875, -0.1714019775390625, -0.13214111328125, -0.0928802490234375, -0.053619384765625, -0.0143585205078125, 0.02490234375, 0.0641632080078125, 0.103424072265625, 0.1426849365234375, 0.18194580078125, 0.2212066650390625, 0.260467529296875, 0.2997283935546875, 0.3389892578125, 0.3782501220703125, 0.417510986328125, 0.4567718505859375, 0.49603271484375, 0.5352935791015625, 0.574554443359375, 0.6138153076171875, 0.653076171875, 0.6923370361328125, 0.731597900390625, 0.7708587646484375, 0.81011962890625, 0.8493804931640625, 0.888641357421875, 0.9279022216796875, 0.9671630859375, 1.0064239501953125, 1.045684814453125, 1.0849456787109375, 1.12420654296875, 1.1634674072265625, 1.202728271484375, 1.2419891357421875, 1.28125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 5.0, 4.0, 3.0, 10.0, 9.0, 8.0, 15.0, 15.0, 29.0, 70.0, 144.0, 389.0, 1937.0, 938.0, 257.0, 111.0, 36.0, 34.0, 22.0, 10.0, 12.0, 9.0, 4.0, 5.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.61865234375, -0.5936660766601562, -0.5686798095703125, -0.5436935424804688, -0.518707275390625, -0.49372100830078125, -0.4687347412109375, -0.44374847412109375, -0.41876220703125, -0.39377593994140625, -0.3687896728515625, -0.34380340576171875, -0.318817138671875, -0.29383087158203125, -0.2688446044921875, -0.24385833740234375, -0.2188720703125, -0.19388580322265625, -0.1688995361328125, -0.14391326904296875, -0.118927001953125, -0.09394073486328125, -0.0689544677734375, -0.04396820068359375, -0.01898193359375, 0.00600433349609375, 0.0309906005859375, 0.05597686767578125, 0.080963134765625, 0.10594940185546875, 0.1309356689453125, 0.15592193603515625, 0.180908203125, 0.20589447021484375, 0.2308807373046875, 0.25586700439453125, 0.280853271484375, 0.30583953857421875, 0.3308258056640625, 0.35581207275390625, 0.38079833984375, 0.40578460693359375, 0.4307708740234375, 0.45575714111328125, 0.480743408203125, 0.5057296752929688, 0.5307159423828125, 0.5557022094726562, 0.5806884765625, 0.6056747436523438, 0.6306610107421875, 0.6556472778320312, 0.680633544921875, 0.7056198120117188, 0.7306060791015625, 0.7555923461914062, 0.78057861328125, 0.8055648803710938, 0.8305511474609375, 0.8555374145507812, 0.880523681640625, 0.9055099487304688, 0.9304962158203125, 0.9554824829101562, 0.98046875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 14.0, 25.0, 60.0, 110.0, 190.0, 252.0, 175.0, 95.0, 44.0, 19.0, 9.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.564066171646118, -3.422619581222534, -3.281172752380371, -3.139726161956787, -2.998279333114624, -2.85683274269104, -2.715385913848877, -2.573939323425293, -2.432492733001709, -2.291046142578125, -2.149599313735962, -2.008152723312378, -1.8667058944702148, -1.7252593040466309, -1.5838125944137573, -1.4423658847808838, -1.3009190559387207, -1.1594723463058472, -1.0180256366729736, -0.8765789866447449, -0.7351322770118713, -0.5936855673789978, -0.45223891735076904, -0.3107922077178955, -0.16934549808502197, -0.02789880335330963, 0.11354789137840271, 0.25499457120895386, 0.3964412808418274, 0.5378879904747009, 0.6793346405029297, 0.8207813501358032, 0.9622282981872559, 1.1036750078201294, 1.245121717453003, 1.386568307876587, 1.52801513671875, 1.669461727142334, 1.8109084367752075, 1.952355146408081, 2.093801975250244, 2.235248565673828, 2.376695394515991, 2.518141984939575, 2.6595888137817383, 2.8010354042053223, 2.9424819946289062, 3.0839288234710693, 3.2253754138946533, 3.3668220043182373, 3.5082688331604004, 3.6497154235839844, 3.7911622524261475, 3.9326088428497314, 4.0740556716918945, 4.2155022621154785, 4.3569488525390625, 4.4983954429626465, 4.6398420333862305, 4.781289100646973, 4.922735691070557, 5.064182281494141, 5.205628871917725, 5.347075462341309, 5.488522529602051]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 9.0, 6.0, 12.0, 11.0, 21.0, 26.0, 21.0, 30.0, 25.0, 40.0, 50.0, 56.0, 69.0, 50.0, 59.0, 58.0, 63.0, 69.0, 72.0, 55.0, 44.0, 31.0, 30.0, 26.0, 19.0, 20.0, 10.0, 6.0, 9.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.643740653991699, -2.5649056434631348, -2.4860706329345703, -2.407235622406006, -2.3284003734588623, -2.249565362930298, -2.1707303524017334, -2.091895341873169, -2.0130603313446045, -1.93422532081604, -1.855390191078186, -1.7765551805496216, -1.6977201700210571, -1.6188850402832031, -1.5400500297546387, -1.4612150192260742, -1.3823798894882202, -1.3035448789596558, -1.2247097492218018, -1.1458747386932373, -1.0670397281646729, -0.9882046580314636, -0.9093695878982544, -0.8305345773696899, -0.7516995072364807, -0.6728644371032715, -0.594029426574707, -0.5151943564414978, -0.43635931611061096, -0.3575242757797241, -0.2786892056465149, -0.19985419511795044, -0.12101912498474121, -0.04218407720327377, 0.036650970578193665, 0.1154860258102417, 0.19432106614112854, 0.2731561064720154, 0.3519911766052246, 0.43082618713378906, 0.5096612572669983, 0.5884963274002075, 0.667331337928772, 0.7461664080619812, 0.8250014781951904, 0.9038364887237549, 0.9826715588569641, 1.0615065097808838, 1.1403416395187378, 1.2191766500473022, 1.2980117797851562, 1.3768467903137207, 1.4556818008422852, 1.5345168113708496, 1.6133519411087036, 1.692186951637268, 1.771022081375122, 1.8498570919036865, 1.9286922216415405, 2.0075273513793945, 2.086362361907959, 2.1651973724365234, 2.244032382965088, 2.3228673934936523, 2.401702404022217]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 6.0, 3.0, 13.0, 10.0, 23.0, 26.0, 54.0, 97.0, 137.0, 211.0, 408.0, 743.0, 1688.0, 4598.0, 16029.0, 70432.0, 375224.0, 460664.0, 89133.0, 19740.0, 5445.0, 1950.0, 820.0, 401.0, 254.0, 158.0, 103.0, 58.0, 42.0, 28.0, 19.0, 11.0, 10.0, 8.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.01953125, -1.94207763671875, -1.8646240234375, -1.78717041015625, -1.709716796875, -1.63226318359375, -1.5548095703125, -1.47735595703125, -1.39990234375, -1.32244873046875, -1.2449951171875, -1.16754150390625, -1.090087890625, -1.01263427734375, -0.9351806640625, -0.85772705078125, -0.7802734375, -0.70281982421875, -0.6253662109375, -0.54791259765625, -0.470458984375, -0.39300537109375, -0.3155517578125, -0.23809814453125, -0.16064453125, -0.08319091796875, -0.0057373046875, 0.07171630859375, 0.149169921875, 0.22662353515625, 0.3040771484375, 0.38153076171875, 0.458984375, 0.53643798828125, 0.6138916015625, 0.69134521484375, 0.768798828125, 0.84625244140625, 0.9237060546875, 1.00115966796875, 1.07861328125, 1.15606689453125, 1.2335205078125, 1.31097412109375, 1.388427734375, 1.46588134765625, 1.5433349609375, 1.62078857421875, 1.6982421875, 1.77569580078125, 1.8531494140625, 1.93060302734375, 2.008056640625, 2.08551025390625, 2.1629638671875, 2.24041748046875, 2.31787109375, 2.39532470703125, 2.4727783203125, 2.55023193359375, 2.627685546875, 2.70513916015625, 2.7825927734375, 2.86004638671875, 2.9375]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 6.0, 10.0, 17.0, 21.0, 30.0, 44.0, 45.0, 59.0, 64.0, 81.0, 74.0, 76.0, 80.0, 77.0, 63.0, 53.0, 55.0, 43.0, 27.0, 22.0, 17.0, 15.0, 12.0, 8.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72998046875, -0.6992874145507812, -0.6685943603515625, -0.6379013061523438, -0.607208251953125, -0.5765151977539062, -0.5458221435546875, -0.5151290893554688, -0.48443603515625, -0.45374298095703125, -0.4230499267578125, -0.39235687255859375, -0.361663818359375, -0.33097076416015625, -0.3002777099609375, -0.26958465576171875, -0.2388916015625, -0.20819854736328125, -0.1775054931640625, -0.14681243896484375, -0.116119384765625, -0.08542633056640625, -0.0547332763671875, -0.02404022216796875, 0.00665283203125, 0.03734588623046875, 0.0680389404296875, 0.09873199462890625, 0.129425048828125, 0.16011810302734375, 0.1908111572265625, 0.22150421142578125, 0.252197265625, 0.28289031982421875, 0.3135833740234375, 0.34427642822265625, 0.374969482421875, 0.40566253662109375, 0.4363555908203125, 0.46704864501953125, 0.49774169921875, 0.5284347534179688, 0.5591278076171875, 0.5898208618164062, 0.620513916015625, 0.6512069702148438, 0.6819000244140625, 0.7125930786132812, 0.7432861328125, 0.7739791870117188, 0.8046722412109375, 0.8353652954101562, 0.866058349609375, 0.8967514038085938, 0.9274444580078125, 0.9581375122070312, 0.98883056640625, 1.0195236206054688, 1.0502166748046875, 1.0809097290039062, 1.111602783203125, 1.1422958374023438, 1.1729888916015625, 1.2036819458007812, 1.234375]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 5.0, 8.0, 9.0, 9.0, 22.0, 21.0, 29.0, 55.0, 62.0, 106.0, 147.0, 220.0, 369.0, 712.0, 1445.0, 3211.0, 7463.0, 18239.0, 48181.0, 140530.0, 378642.0, 290979.0, 98978.0, 34658.0, 13711.0, 5664.0, 2407.0, 1172.0, 576.0, 302.0, 200.0, 108.0, 80.0, 67.0, 31.0, 42.0, 20.0, 13.0, 18.0, 6.0, 4.0, 10.0, 5.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0], "bins": [-1.375, -1.3331298828125, -1.291259765625, -1.2493896484375, -1.20751953125, -1.1656494140625, -1.123779296875, -1.0819091796875, -1.0400390625, -0.9981689453125, -0.956298828125, -0.9144287109375, -0.87255859375, -0.8306884765625, -0.788818359375, -0.7469482421875, -0.705078125, -0.6632080078125, -0.621337890625, -0.5794677734375, -0.53759765625, -0.4957275390625, -0.453857421875, -0.4119873046875, -0.3701171875, -0.3282470703125, -0.286376953125, -0.2445068359375, -0.20263671875, -0.1607666015625, -0.118896484375, -0.0770263671875, -0.03515625, 0.0067138671875, 0.048583984375, 0.0904541015625, 0.13232421875, 0.1741943359375, 0.216064453125, 0.2579345703125, 0.2998046875, 0.3416748046875, 0.383544921875, 0.4254150390625, 0.46728515625, 0.5091552734375, 0.551025390625, 0.5928955078125, 0.634765625, 0.6766357421875, 0.718505859375, 0.7603759765625, 0.80224609375, 0.8441162109375, 0.885986328125, 0.9278564453125, 0.9697265625, 1.0115966796875, 1.053466796875, 1.0953369140625, 1.13720703125, 1.1790771484375, 1.220947265625, 1.2628173828125, 1.3046875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 7.0, 12.0, 14.0, 7.0, 21.0, 17.0, 23.0, 15.0, 24.0, 21.0, 35.0, 21.0, 34.0, 30.0, 38.0, 47.0, 39.0, 43.0, 44.0, 40.0, 43.0, 36.0, 45.0, 42.0, 38.0, 40.0, 34.0, 30.0, 23.0, 23.0, 23.0, 16.0, 12.0, 7.0, 11.0, 9.0, 3.0, 5.0, 6.0, 8.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.078125, -2.012298583984375, -1.94647216796875, -1.880645751953125, -1.8148193359375, -1.748992919921875, -1.68316650390625, -1.617340087890625, -1.551513671875, -1.485687255859375, -1.41986083984375, -1.354034423828125, -1.2882080078125, -1.222381591796875, -1.15655517578125, -1.090728759765625, -1.02490234375, -0.959075927734375, -0.89324951171875, -0.827423095703125, -0.7615966796875, -0.695770263671875, -0.62994384765625, -0.564117431640625, -0.498291015625, -0.432464599609375, -0.36663818359375, -0.300811767578125, -0.2349853515625, -0.169158935546875, -0.10333251953125, -0.037506103515625, 0.0283203125, 0.094146728515625, 0.15997314453125, 0.225799560546875, 0.2916259765625, 0.357452392578125, 0.42327880859375, 0.489105224609375, 0.554931640625, 0.620758056640625, 0.68658447265625, 0.752410888671875, 0.8182373046875, 0.884063720703125, 0.94989013671875, 1.015716552734375, 1.08154296875, 1.147369384765625, 1.21319580078125, 1.279022216796875, 1.3448486328125, 1.410675048828125, 1.47650146484375, 1.542327880859375, 1.608154296875, 1.673980712890625, 1.73980712890625, 1.805633544921875, 1.8714599609375, 1.937286376953125, 2.00311279296875, 2.068939208984375, 2.134765625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 7.0, 7.0, 9.0, 22.0, 31.0, 49.0, 104.0, 153.0, 319.0, 663.0, 1415.0, 3557.0, 10826.0, 61152.0, 769355.0, 172464.0, 19248.0, 5387.0, 1995.0, 877.0, 431.0, 202.0, 119.0, 70.0, 36.0, 16.0, 12.0, 7.0, 5.0, 3.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.97314453125, -0.947998046875, -0.9228515625, -0.897705078125, -0.87255859375, -0.847412109375, -0.822265625, -0.797119140625, -0.77197265625, -0.746826171875, -0.7216796875, -0.696533203125, -0.67138671875, -0.646240234375, -0.62109375, -0.595947265625, -0.57080078125, -0.545654296875, -0.5205078125, -0.495361328125, -0.47021484375, -0.445068359375, -0.419921875, -0.394775390625, -0.36962890625, -0.344482421875, -0.3193359375, -0.294189453125, -0.26904296875, -0.243896484375, -0.21875, -0.193603515625, -0.16845703125, -0.143310546875, -0.1181640625, -0.093017578125, -0.06787109375, -0.042724609375, -0.017578125, 0.007568359375, 0.03271484375, 0.057861328125, 0.0830078125, 0.108154296875, 0.13330078125, 0.158447265625, 0.18359375, 0.208740234375, 0.23388671875, 0.259033203125, 0.2841796875, 0.309326171875, 0.33447265625, 0.359619140625, 0.384765625, 0.409912109375, 0.43505859375, 0.460205078125, 0.4853515625, 0.510498046875, 0.53564453125, 0.560791015625, 0.5859375, 0.611083984375, 0.63623046875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 5.0, 8.0, 12.0, 11.0, 7.0, 16.0, 20.0, 32.0, 50.0, 125.0, 232.0, 213.0, 134.0, 64.0, 19.0, 15.0, 19.0, 10.0, 13.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00025081634521484375, -0.00024497322738170624, -0.00023913010954856873, -0.0002332869917154312, -0.0002274438738822937, -0.0002216007560491562, -0.00021575763821601868, -0.00020991452038288116, -0.00020407140254974365, -0.00019822828471660614, -0.00019238516688346863, -0.00018654204905033112, -0.0001806989312171936, -0.0001748558133840561, -0.00016901269555091858, -0.00016316957771778107, -0.00015732645988464355, -0.00015148334205150604, -0.00014564022421836853, -0.00013979710638523102, -0.0001339539885520935, -0.000128110870718956, -0.00012226775288581848, -0.00011642463505268097, -0.00011058151721954346, -0.00010473839938640594, -9.889528155326843e-05, -9.305216372013092e-05, -8.720904588699341e-05, -8.13659280538559e-05, -7.552281022071838e-05, -6.967969238758087e-05, -6.383657455444336e-05, -5.799345672130585e-05, -5.2150338888168335e-05, -4.630722105503082e-05, -4.046410322189331e-05, -3.46209853887558e-05, -2.8777867555618286e-05, -2.2934749722480774e-05, -1.7091631889343262e-05, -1.124851405620575e-05, -5.405396223068237e-06, 4.377216100692749e-07, 6.280839443206787e-06, 1.21239572763443e-05, 1.796707510948181e-05, 2.3810192942619324e-05, 2.9653310775756836e-05, 3.549642860889435e-05, 4.133954644203186e-05, 4.718266427516937e-05, 5.3025782108306885e-05, 5.88688999414444e-05, 6.471201777458191e-05, 7.055513560771942e-05, 7.639825344085693e-05, 8.224137127399445e-05, 8.808448910713196e-05, 9.392760694026947e-05, 9.977072477340698e-05, 0.0001056138426065445, 0.00011145696043968201, 0.00011730007827281952, 0.00012314319610595703]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 4.0, 5.0, 14.0, 22.0, 27.0, 33.0, 59.0, 111.0, 174.0, 297.0, 593.0, 1334.0, 3608.0, 13844.0, 163733.0, 817579.0, 36751.0, 6318.0, 2131.0, 863.0, 408.0, 235.0, 138.0, 70.0, 61.0, 40.0, 35.0, 16.0, 13.0, 12.0, 5.0, 8.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.23046875, -1.1945343017578125, -1.158599853515625, -1.1226654052734375, -1.08673095703125, -1.0507965087890625, -1.014862060546875, -0.9789276123046875, -0.9429931640625, -0.9070587158203125, -0.871124267578125, -0.8351898193359375, -0.79925537109375, -0.7633209228515625, -0.727386474609375, -0.6914520263671875, -0.655517578125, -0.6195831298828125, -0.583648681640625, -0.5477142333984375, -0.51177978515625, -0.4758453369140625, -0.439910888671875, -0.4039764404296875, -0.3680419921875, -0.3321075439453125, -0.296173095703125, -0.2602386474609375, -0.22430419921875, -0.1883697509765625, -0.152435302734375, -0.1165008544921875, -0.08056640625, -0.0446319580078125, -0.008697509765625, 0.0272369384765625, 0.06317138671875, 0.0991058349609375, 0.135040283203125, 0.1709747314453125, 0.2069091796875, 0.2428436279296875, 0.278778076171875, 0.3147125244140625, 0.35064697265625, 0.3865814208984375, 0.422515869140625, 0.4584503173828125, 0.494384765625, 0.5303192138671875, 0.566253662109375, 0.6021881103515625, 0.63812255859375, 0.6740570068359375, 0.709991455078125, 0.7459259033203125, 0.7818603515625, 0.8177947998046875, 0.853729248046875, 0.8896636962890625, 0.92559814453125, 0.9615325927734375, 0.997467041015625, 1.0334014892578125, 1.0693359375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 3.0, 4.0, 4.0, 5.0, 6.0, 8.0, 12.0, 20.0, 22.0, 21.0, 42.0, 58.0, 58.0, 98.0, 147.0, 119.0, 103.0, 57.0, 61.0, 40.0, 33.0, 23.0, 12.0, 12.0, 6.0, 10.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.67919921875, -0.6587295532226562, -0.6382598876953125, -0.6177902221679688, -0.597320556640625, -0.5768508911132812, -0.5563812255859375, -0.5359115600585938, -0.51544189453125, -0.49497222900390625, -0.4745025634765625, -0.45403289794921875, -0.433563232421875, -0.41309356689453125, -0.3926239013671875, -0.37215423583984375, -0.3516845703125, -0.33121490478515625, -0.3107452392578125, -0.29027557373046875, -0.269805908203125, -0.24933624267578125, -0.2288665771484375, -0.20839691162109375, -0.18792724609375, -0.16745758056640625, -0.1469879150390625, -0.12651824951171875, -0.106048583984375, -0.08557891845703125, -0.0651092529296875, -0.04463958740234375, -0.024169921875, -0.00370025634765625, 0.0167694091796875, 0.03723907470703125, 0.057708740234375, 0.07817840576171875, 0.0986480712890625, 0.11911773681640625, 0.13958740234375, 0.16005706787109375, 0.1805267333984375, 0.20099639892578125, 0.221466064453125, 0.24193572998046875, 0.2624053955078125, 0.28287506103515625, 0.3033447265625, 0.32381439208984375, 0.3442840576171875, 0.36475372314453125, 0.385223388671875, 0.40569305419921875, 0.4261627197265625, 0.44663238525390625, 0.46710205078125, 0.48757171630859375, 0.5080413818359375, 0.5285110473632812, 0.548980712890625, 0.5694503784179688, 0.5899200439453125, 0.6103897094726562, 0.630859375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 21.0, 43.0, 113.0, 230.0, 278.0, 193.0, 90.0, 23.0, 10.0, 2.0, 2.0, 1.0, 3.0, 1.0], "bins": [-37.72101974487305, -37.0285530090332, -36.33608627319336, -35.643619537353516, -34.95115280151367, -34.25868606567383, -33.566219329833984, -32.87375259399414, -32.1812858581543, -31.488819122314453, -30.79635238647461, -30.103885650634766, -29.411418914794922, -28.718952178955078, -28.026485443115234, -27.334020614624023, -26.641555786132812, -25.94908905029297, -25.256622314453125, -24.56415557861328, -23.871688842773438, -23.179222106933594, -22.48675537109375, -21.79429054260254, -21.101821899414062, -20.40935516357422, -19.716888427734375, -19.02442169189453, -18.331954956054688, -17.639488220214844, -16.947021484375, -16.25455665588379, -15.562089920043945, -14.869623184204102, -14.177156448364258, -13.484689712524414, -12.792223930358887, -12.099757194519043, -11.4072904586792, -10.714824676513672, -10.022357940673828, -9.329891204833984, -8.63742446899414, -7.944958209991455, -7.2524919509887695, -6.560025215148926, -5.867558479309082, -5.1750922203063965, -4.4826250076293945, -3.79015851020813, -3.0976920127868652, -2.4052252769470215, -1.7127587795257568, -1.0202922821044922, -0.32782554626464844, 0.3646407127380371, 1.0571074485778809, 1.7495739459991455, 2.44204044342041, 3.134507179260254, 3.8269736766815186, 4.519440174102783, 5.211906909942627, 5.9043731689453125, 6.596839904785156]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 4.0, 4.0, 7.0, 11.0, 7.0, 12.0, 13.0, 21.0, 21.0, 21.0, 25.0, 27.0, 33.0, 35.0, 49.0, 42.0, 30.0, 40.0, 40.0, 33.0, 53.0, 47.0, 47.0, 37.0, 36.0, 31.0, 38.0, 37.0, 32.0, 17.0, 27.0, 22.0, 17.0, 18.0, 16.0, 15.0, 7.0, 10.0, 6.0, 1.0, 7.0, 3.0, 1.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.151128768920898, -10.834240913391113, -10.517353057861328, -10.200465202331543, -9.883577346801758, -9.566689491271973, -9.249801635742188, -8.932913780212402, -8.616025924682617, -8.299138069152832, -7.982250213623047, -7.665362358093262, -7.348474502563477, -7.031586647033691, -6.714698791503906, -6.397810935974121, -6.080923080444336, -5.764035224914551, -5.447147369384766, -5.1302595138549805, -4.813371658325195, -4.49648380279541, -4.179595947265625, -3.86270809173584, -3.5458202362060547, -3.2289323806762695, -2.9120445251464844, -2.595156669616699, -2.278268814086914, -1.961380958557129, -1.6444931030273438, -1.3276052474975586, -1.010716438293457, -0.6938285827636719, -0.3769407272338867, -0.06005287170410156, 0.2568349838256836, 0.5737228393554688, 0.8906106948852539, 1.207498550415039, 1.5243864059448242, 1.8412742614746094, 2.1581621170043945, 2.4750499725341797, 2.791937828063965, 3.10882568359375, 3.425713539123535, 3.7426013946533203, 4.0594892501831055, 4.376377105712891, 4.693264961242676, 5.010152816772461, 5.327040672302246, 5.643928527832031, 5.960816383361816, 6.277704238891602, 6.594592094421387, 6.911479949951172, 7.228367805480957, 7.545255661010742, 7.862143516540527, 8.179031372070312, 8.495919227600098, 8.812807083129883, 9.129694938659668]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 6.0, 5.0, 14.0, 15.0, 29.0, 33.0, 99.0, 152.0, 314.0, 606.0, 1327.0, 3473.0, 10777.0, 59730.0, 3908685.0, 181810.0, 18090.0, 5127.0, 1984.0, 846.0, 445.0, 250.0, 173.0, 92.0, 53.0, 45.0, 29.0, 17.0, 10.0, 10.0, 12.0, 11.0, 4.0, 7.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.16796875, -2.076446533203125, -1.98492431640625, -1.893402099609375, -1.8018798828125, -1.710357666015625, -1.61883544921875, -1.527313232421875, -1.435791015625, -1.344268798828125, -1.25274658203125, -1.161224365234375, -1.0697021484375, -0.978179931640625, -0.88665771484375, -0.795135498046875, -0.70361328125, -0.612091064453125, -0.52056884765625, -0.429046630859375, -0.3375244140625, -0.246002197265625, -0.15447998046875, -0.062957763671875, 0.028564453125, 0.120086669921875, 0.21160888671875, 0.303131103515625, 0.3946533203125, 0.486175537109375, 0.57769775390625, 0.669219970703125, 0.7607421875, 0.852264404296875, 0.94378662109375, 1.035308837890625, 1.1268310546875, 1.218353271484375, 1.30987548828125, 1.401397705078125, 1.492919921875, 1.584442138671875, 1.67596435546875, 1.767486572265625, 1.8590087890625, 1.950531005859375, 2.04205322265625, 2.133575439453125, 2.22509765625, 2.316619873046875, 2.40814208984375, 2.499664306640625, 2.5911865234375, 2.682708740234375, 2.77423095703125, 2.865753173828125, 2.957275390625, 3.048797607421875, 3.14031982421875, 3.231842041015625, 3.3233642578125, 3.414886474609375, 3.50640869140625, 3.597930908203125, 3.689453125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 4.0, 3.0, 9.0, 11.0, 14.0, 24.0, 37.0, 36.0, 50.0, 56.0, 66.0, 79.0, 80.0, 83.0, 92.0, 63.0, 88.0, 41.0, 47.0, 39.0, 25.0, 25.0, 18.0, 7.0, 3.0, 6.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7607421875, -0.72833251953125, -0.6959228515625, -0.66351318359375, -0.631103515625, -0.59869384765625, -0.5662841796875, -0.53387451171875, -0.50146484375, -0.46905517578125, -0.4366455078125, -0.40423583984375, -0.371826171875, -0.33941650390625, -0.3070068359375, -0.27459716796875, -0.2421875, -0.20977783203125, -0.1773681640625, -0.14495849609375, -0.112548828125, -0.08013916015625, -0.0477294921875, -0.01531982421875, 0.01708984375, 0.04949951171875, 0.0819091796875, 0.11431884765625, 0.146728515625, 0.17913818359375, 0.2115478515625, 0.24395751953125, 0.2763671875, 0.30877685546875, 0.3411865234375, 0.37359619140625, 0.406005859375, 0.43841552734375, 0.4708251953125, 0.50323486328125, 0.53564453125, 0.56805419921875, 0.6004638671875, 0.63287353515625, 0.665283203125, 0.69769287109375, 0.7301025390625, 0.76251220703125, 0.794921875, 0.82733154296875, 0.8597412109375, 0.89215087890625, 0.924560546875, 0.95697021484375, 0.9893798828125, 1.02178955078125, 1.05419921875, 1.08660888671875, 1.1190185546875, 1.15142822265625, 1.183837890625, 1.21624755859375, 1.2486572265625, 1.28106689453125, 1.3134765625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 0.0, 5.0, 10.0, 7.0, 15.0, 17.0, 24.0, 38.0, 55.0, 98.0, 170.0, 280.0, 493.0, 822.0, 1526.0, 3065.0, 6698.0, 16961.0, 62971.0, 764216.0, 3190845.0, 105889.0, 23992.0, 8468.0, 3751.0, 1793.0, 940.0, 454.0, 261.0, 155.0, 110.0, 54.0, 44.0, 21.0, 10.0, 11.0, 7.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.248046875, -1.2066497802734375, -1.165252685546875, -1.1238555908203125, -1.08245849609375, -1.0410614013671875, -0.999664306640625, -0.9582672119140625, -0.9168701171875, -0.8754730224609375, -0.834075927734375, -0.7926788330078125, -0.75128173828125, -0.7098846435546875, -0.668487548828125, -0.6270904541015625, -0.585693359375, -0.5442962646484375, -0.502899169921875, -0.4615020751953125, -0.42010498046875, -0.3787078857421875, -0.337310791015625, -0.2959136962890625, -0.2545166015625, -0.2131195068359375, -0.171722412109375, -0.1303253173828125, -0.08892822265625, -0.0475311279296875, -0.006134033203125, 0.0352630615234375, 0.07666015625, 0.1180572509765625, 0.159454345703125, 0.2008514404296875, 0.24224853515625, 0.2836456298828125, 0.325042724609375, 0.3664398193359375, 0.4078369140625, 0.4492340087890625, 0.490631103515625, 0.5320281982421875, 0.57342529296875, 0.6148223876953125, 0.656219482421875, 0.6976165771484375, 0.739013671875, 0.7804107666015625, 0.821807861328125, 0.8632049560546875, 0.90460205078125, 0.9459991455078125, 0.987396240234375, 1.0287933349609375, 1.0701904296875, 1.1115875244140625, 1.152984619140625, 1.1943817138671875, 1.23577880859375, 1.2771759033203125, 1.318572998046875, 1.3599700927734375, 1.4013671875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 11.0, 8.0, 15.0, 20.0, 49.0, 76.0, 171.0, 538.0, 2401.0, 449.0, 132.0, 68.0, 52.0, 16.0, 14.0, 12.0, 2.0, 8.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.03515625, -1.0101776123046875, -0.985198974609375, -0.9602203369140625, -0.93524169921875, -0.9102630615234375, -0.885284423828125, -0.8603057861328125, -0.8353271484375, -0.8103485107421875, -0.785369873046875, -0.7603912353515625, -0.73541259765625, -0.7104339599609375, -0.685455322265625, -0.6604766845703125, -0.635498046875, -0.6105194091796875, -0.585540771484375, -0.5605621337890625, -0.53558349609375, -0.5106048583984375, -0.485626220703125, -0.4606475830078125, -0.4356689453125, -0.4106903076171875, -0.385711669921875, -0.3607330322265625, -0.33575439453125, -0.3107757568359375, -0.285797119140625, -0.2608184814453125, -0.23583984375, -0.2108612060546875, -0.185882568359375, -0.1609039306640625, -0.13592529296875, -0.1109466552734375, -0.085968017578125, -0.0609893798828125, -0.0360107421875, -0.0110321044921875, 0.013946533203125, 0.0389251708984375, 0.06390380859375, 0.0888824462890625, 0.113861083984375, 0.1388397216796875, 0.163818359375, 0.1887969970703125, 0.213775634765625, 0.2387542724609375, 0.26373291015625, 0.2887115478515625, 0.313690185546875, 0.3386688232421875, 0.3636474609375, 0.3886260986328125, 0.413604736328125, 0.4385833740234375, 0.46356201171875, 0.4885406494140625, 0.513519287109375, 0.5384979248046875, 0.5634765625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 4.0, 4.0, 10.0, 18.0, 23.0, 49.0, 71.0, 104.0, 133.0, 145.0, 145.0, 111.0, 86.0, 46.0, 19.0, 15.0, 6.0, 8.0, 4.0, 2.0, 1.0, 3.0], "bins": [-4.86213493347168, -4.768665313720703, -4.675195693969727, -4.58172607421875, -4.488256454467773, -4.394786834716797, -4.30131721496582, -4.207847595214844, -4.114377975463867, -4.020908355712891, -3.927438735961914, -3.8339691162109375, -3.740499496459961, -3.6470298767089844, -3.553560256958008, -3.460090398788452, -3.3666205406188965, -3.27315092086792, -3.1796813011169434, -3.086211681365967, -2.9927420616149902, -2.8992724418640137, -2.805802822113037, -2.7123329639434814, -2.618863582611084, -2.5253939628601074, -2.431924343109131, -2.3384547233581543, -2.2449851036071777, -2.151515483856201, -2.0580458641052246, -1.964576005935669, -1.871106505393982, -1.7776368856430054, -1.6841672658920288, -1.5906975269317627, -1.4972279071807861, -1.4037582874298096, -1.310288667678833, -1.2168190479278564, -1.1233494281768799, -1.0298798084259033, -0.936410129070282, -0.8429405093193054, -0.7494708299636841, -0.6560012102127075, -0.562531590461731, -0.4690619111061096, -0.3755922317504883, -0.28212258219718933, -0.18865294754505157, -0.09518331289291382, -0.0017136633396148682, 0.09175598621368408, 0.18522560596466064, 0.278695285320282, 0.37216490507125854, 0.4656345546245575, 0.5591042041778564, 0.652573823928833, 0.7460434436798096, 0.8395131230354309, 0.9329827427864075, 1.0264524221420288, 1.1199220418930054]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 8.0, 7.0, 13.0, 25.0, 22.0, 35.0, 28.0, 32.0, 33.0, 48.0, 48.0, 55.0, 53.0, 58.0, 57.0, 54.0, 59.0, 34.0, 48.0, 45.0, 45.0, 32.0, 34.0, 25.0, 19.0, 15.0, 15.0, 14.0, 9.0, 16.0, 5.0, 8.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.6427412033081055, -2.5790224075317383, -2.515303611755371, -2.451584815979004, -2.3878660202026367, -2.3241474628448486, -2.2604286670684814, -2.1967098712921143, -2.132991075515747, -2.06927227973938, -2.0055534839630127, -1.941834807395935, -1.8781160116195679, -1.8143972158432007, -1.750678539276123, -1.6869597434997559, -1.6232409477233887, -1.5595221519470215, -1.4958033561706543, -1.4320846796035767, -1.3683658838272095, -1.3046470880508423, -1.2409284114837646, -1.1772096157073975, -1.1134908199310303, -1.049772024154663, -0.9860532879829407, -0.9223345518112183, -0.8586157560348511, -0.7948969602584839, -0.7311782240867615, -0.6674594879150391, -0.6037404537200928, -0.5400216579437256, -0.4763029217720032, -0.4125841557979584, -0.3488653898239136, -0.2851466238498688, -0.22142785787582397, -0.15770909190177917, -0.09399032592773438, -0.030271559953689575, 0.033447206020355225, 0.09716597199440002, 0.16088473796844482, 0.22460350394248962, 0.2883222699165344, 0.3520410358905792, 0.415759801864624, 0.4794785678386688, 0.5431973338127136, 0.606916069984436, 0.6706348657608032, 0.7343536615371704, 0.7980723977088928, 0.8617911338806152, 0.9255099296569824, 0.9892287254333496, 1.0529475212097168, 1.1166661977767944, 1.1803849935531616, 1.2441037893295288, 1.3078224658966064, 1.3715412616729736, 1.4352600574493408]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 7.0, 16.0, 16.0, 19.0, 32.0, 58.0, 95.0, 152.0, 263.0, 559.0, 1171.0, 2562.0, 7579.0, 27542.0, 134505.0, 537799.0, 266264.0, 50563.0, 12281.0, 3966.0, 1521.0, 734.0, 324.0, 189.0, 111.0, 73.0, 46.0, 21.0, 20.0, 13.0, 16.0, 8.0, 11.0, 4.0, 2.0, 5.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.412109375, -3.323944091796875, -3.23577880859375, -3.147613525390625, -3.0594482421875, -2.971282958984375, -2.88311767578125, -2.794952392578125, -2.706787109375, -2.618621826171875, -2.53045654296875, -2.442291259765625, -2.3541259765625, -2.265960693359375, -2.17779541015625, -2.089630126953125, -2.00146484375, -1.913299560546875, -1.82513427734375, -1.736968994140625, -1.6488037109375, -1.560638427734375, -1.47247314453125, -1.384307861328125, -1.296142578125, -1.207977294921875, -1.11981201171875, -1.031646728515625, -0.9434814453125, -0.855316162109375, -0.76715087890625, -0.678985595703125, -0.5908203125, -0.502655029296875, -0.41448974609375, -0.326324462890625, -0.2381591796875, -0.149993896484375, -0.06182861328125, 0.026336669921875, 0.114501953125, 0.202667236328125, 0.29083251953125, 0.378997802734375, 0.4671630859375, 0.555328369140625, 0.64349365234375, 0.731658935546875, 0.81982421875, 0.907989501953125, 0.99615478515625, 1.084320068359375, 1.1724853515625, 1.260650634765625, 1.34881591796875, 1.436981201171875, 1.525146484375, 1.613311767578125, 1.70147705078125, 1.789642333984375, 1.8778076171875, 1.965972900390625, 2.05413818359375, 2.142303466796875, 2.23046875]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 8.0, 11.0, 8.0, 26.0, 34.0, 28.0, 45.0, 48.0, 68.0, 77.0, 84.0, 87.0, 80.0, 92.0, 64.0, 63.0, 45.0, 38.0, 35.0, 18.0, 23.0, 11.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.783203125, -0.7503204345703125, -0.717437744140625, -0.6845550537109375, -0.65167236328125, -0.6187896728515625, -0.585906982421875, -0.5530242919921875, -0.5201416015625, -0.4872589111328125, -0.454376220703125, -0.4214935302734375, -0.38861083984375, -0.3557281494140625, -0.322845458984375, -0.2899627685546875, -0.257080078125, -0.2241973876953125, -0.191314697265625, -0.1584320068359375, -0.12554931640625, -0.0926666259765625, -0.059783935546875, -0.0269012451171875, 0.0059814453125, 0.0388641357421875, 0.071746826171875, 0.1046295166015625, 0.13751220703125, 0.1703948974609375, 0.203277587890625, 0.2361602783203125, 0.26904296875, 0.3019256591796875, 0.334808349609375, 0.3676910400390625, 0.40057373046875, 0.4334564208984375, 0.466339111328125, 0.4992218017578125, 0.5321044921875, 0.5649871826171875, 0.597869873046875, 0.6307525634765625, 0.66363525390625, 0.6965179443359375, 0.729400634765625, 0.7622833251953125, 0.795166015625, 0.8280487060546875, 0.860931396484375, 0.8938140869140625, 0.92669677734375, 0.9595794677734375, 0.992462158203125, 1.0253448486328125, 1.0582275390625, 1.0911102294921875, 1.123992919921875, 1.1568756103515625, 1.18975830078125, 1.2226409912109375, 1.255523681640625, 1.2884063720703125, 1.3212890625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 9.0, 7.0, 17.0, 21.0, 25.0, 34.0, 48.0, 55.0, 80.0, 152.0, 246.0, 437.0, 800.0, 1632.0, 3457.0, 8733.0, 24980.0, 82905.0, 288408.0, 423433.0, 146896.0, 42473.0, 13719.0, 5220.0, 2214.0, 1102.0, 580.0, 341.0, 173.0, 116.0, 72.0, 50.0, 32.0, 25.0, 22.0, 16.0, 9.0, 2.0, 5.0, 3.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4306640625, -1.379974365234375, -1.32928466796875, -1.278594970703125, -1.2279052734375, -1.177215576171875, -1.12652587890625, -1.075836181640625, -1.025146484375, -0.974456787109375, -0.92376708984375, -0.873077392578125, -0.8223876953125, -0.771697998046875, -0.72100830078125, -0.670318603515625, -0.61962890625, -0.568939208984375, -0.51824951171875, -0.467559814453125, -0.4168701171875, -0.366180419921875, -0.31549072265625, -0.264801025390625, -0.214111328125, -0.163421630859375, -0.11273193359375, -0.062042236328125, -0.0113525390625, 0.039337158203125, 0.09002685546875, 0.140716552734375, 0.19140625, 0.242095947265625, 0.29278564453125, 0.343475341796875, 0.3941650390625, 0.444854736328125, 0.49554443359375, 0.546234130859375, 0.596923828125, 0.647613525390625, 0.69830322265625, 0.748992919921875, 0.7996826171875, 0.850372314453125, 0.90106201171875, 0.951751708984375, 1.00244140625, 1.053131103515625, 1.10382080078125, 1.154510498046875, 1.2052001953125, 1.255889892578125, 1.30657958984375, 1.357269287109375, 1.407958984375, 1.458648681640625, 1.50933837890625, 1.560028076171875, 1.6107177734375, 1.661407470703125, 1.71209716796875, 1.762786865234375, 1.8134765625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 10.0, 9.0, 12.0, 14.0, 18.0, 13.0, 16.0, 17.0, 27.0, 29.0, 33.0, 34.0, 42.0, 44.0, 43.0, 48.0, 65.0, 44.0, 42.0, 56.0, 39.0, 40.0, 37.0, 30.0, 27.0, 28.0, 25.0, 31.0, 27.0, 20.0, 6.0, 13.0, 9.0, 11.0, 3.0, 7.0, 5.0, 7.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-2.646484375, -2.56683349609375, -2.4871826171875, -2.40753173828125, -2.327880859375, -2.24822998046875, -2.1685791015625, -2.08892822265625, -2.00927734375, -1.92962646484375, -1.8499755859375, -1.77032470703125, -1.690673828125, -1.61102294921875, -1.5313720703125, -1.45172119140625, -1.3720703125, -1.29241943359375, -1.2127685546875, -1.13311767578125, -1.053466796875, -0.97381591796875, -0.8941650390625, -0.81451416015625, -0.73486328125, -0.65521240234375, -0.5755615234375, -0.49591064453125, -0.416259765625, -0.33660888671875, -0.2569580078125, -0.17730712890625, -0.09765625, -0.01800537109375, 0.0616455078125, 0.14129638671875, 0.220947265625, 0.30059814453125, 0.3802490234375, 0.45989990234375, 0.53955078125, 0.61920166015625, 0.6988525390625, 0.77850341796875, 0.858154296875, 0.93780517578125, 1.0174560546875, 1.09710693359375, 1.1767578125, 1.25640869140625, 1.3360595703125, 1.41571044921875, 1.495361328125, 1.57501220703125, 1.6546630859375, 1.73431396484375, 1.81396484375, 1.89361572265625, 1.9732666015625, 2.05291748046875, 2.132568359375, 2.21221923828125, 2.2918701171875, 2.37152099609375, 2.451171875]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 12.0, 17.0, 25.0, 35.0, 49.0, 90.0, 145.0, 301.0, 635.0, 1912.0, 9024.0, 137835.0, 842480.0, 48715.0, 5011.0, 1226.0, 505.0, 220.0, 119.0, 82.0, 36.0, 25.0, 15.0, 12.0, 13.0, 7.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5849609375, -1.53594970703125, -1.4869384765625, -1.43792724609375, -1.388916015625, -1.33990478515625, -1.2908935546875, -1.24188232421875, -1.19287109375, -1.14385986328125, -1.0948486328125, -1.04583740234375, -0.996826171875, -0.94781494140625, -0.8988037109375, -0.84979248046875, -0.80078125, -0.75177001953125, -0.7027587890625, -0.65374755859375, -0.604736328125, -0.55572509765625, -0.5067138671875, -0.45770263671875, -0.40869140625, -0.35968017578125, -0.3106689453125, -0.26165771484375, -0.212646484375, -0.16363525390625, -0.1146240234375, -0.06561279296875, -0.0166015625, 0.03240966796875, 0.0814208984375, 0.13043212890625, 0.179443359375, 0.22845458984375, 0.2774658203125, 0.32647705078125, 0.37548828125, 0.42449951171875, 0.4735107421875, 0.52252197265625, 0.571533203125, 0.62054443359375, 0.6695556640625, 0.71856689453125, 0.767578125, 0.81658935546875, 0.8656005859375, 0.91461181640625, 0.963623046875, 1.01263427734375, 1.0616455078125, 1.11065673828125, 1.15966796875, 1.20867919921875, 1.2576904296875, 1.30670166015625, 1.355712890625, 1.40472412109375, 1.4537353515625, 1.50274658203125, 1.5517578125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 7.0, 5.0, 4.0, 15.0, 20.0, 24.0, 47.0, 50.0, 61.0, 102.0, 146.0, 170.0, 95.0, 67.0, 66.0, 40.0, 34.0, 18.0, 10.0, 7.0, 5.0, 6.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013375282287597656, -0.00012674182653427124, -0.00011973083019256592, -0.0001127198338508606, -0.00010570883750915527, -9.869784116744995e-05, -9.168684482574463e-05, -8.46758484840393e-05, -7.766485214233398e-05, -7.065385580062866e-05, -6.364285945892334e-05, -5.663186311721802e-05, -4.9620866775512695e-05, -4.260987043380737e-05, -3.559887409210205e-05, -2.858787775039673e-05, -2.1576881408691406e-05, -1.4565885066986084e-05, -7.554888725280762e-06, -5.438923835754395e-07, 6.467103958129883e-06, 1.3478100299835205e-05, 2.0489096641540527e-05, 2.750009298324585e-05, 3.451108932495117e-05, 4.1522085666656494e-05, 4.8533082008361816e-05, 5.554407835006714e-05, 6.255507469177246e-05, 6.956607103347778e-05, 7.65770673751831e-05, 8.358806371688843e-05, 9.059906005859375e-05, 9.761005640029907e-05, 0.0001046210527420044, 0.00011163204908370972, 0.00011864304542541504, 0.00012565404176712036, 0.00013266503810882568, 0.000139676034450531, 0.00014668703079223633, 0.00015369802713394165, 0.00016070902347564697, 0.0001677200198173523, 0.00017473101615905762, 0.00018174201250076294, 0.00018875300884246826, 0.00019576400518417358, 0.0002027750015258789, 0.00020978599786758423, 0.00021679699420928955, 0.00022380799055099487, 0.0002308189868927002, 0.00023782998323440552, 0.00024484097957611084, 0.00025185197591781616, 0.0002588629722595215, 0.0002658739686012268, 0.00027288496494293213, 0.00027989596128463745, 0.0002869069576263428, 0.0002939179539680481, 0.0003009289503097534, 0.00030793994665145874, 0.00031495094299316406]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 10.0, 16.0, 25.0, 52.0, 97.0, 158.0, 370.0, 1077.0, 4840.0, 56575.0, 843474.0, 131313.0, 8084.0, 1526.0, 478.0, 197.0, 106.0, 65.0, 28.0, 25.0, 21.0, 10.0, 6.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5380859375, -1.486175537109375, -1.43426513671875, -1.382354736328125, -1.3304443359375, -1.278533935546875, -1.22662353515625, -1.174713134765625, -1.122802734375, -1.070892333984375, -1.01898193359375, -0.967071533203125, -0.9151611328125, -0.863250732421875, -0.81134033203125, -0.759429931640625, -0.70751953125, -0.655609130859375, -0.60369873046875, -0.551788330078125, -0.4998779296875, -0.447967529296875, -0.39605712890625, -0.344146728515625, -0.292236328125, -0.240325927734375, -0.18841552734375, -0.136505126953125, -0.0845947265625, -0.032684326171875, 0.01922607421875, 0.071136474609375, 0.123046875, 0.174957275390625, 0.22686767578125, 0.278778076171875, 0.3306884765625, 0.382598876953125, 0.43450927734375, 0.486419677734375, 0.538330078125, 0.590240478515625, 0.64215087890625, 0.694061279296875, 0.7459716796875, 0.797882080078125, 0.84979248046875, 0.901702880859375, 0.95361328125, 1.005523681640625, 1.05743408203125, 1.109344482421875, 1.1612548828125, 1.213165283203125, 1.26507568359375, 1.316986083984375, 1.368896484375, 1.420806884765625, 1.47271728515625, 1.524627685546875, 1.5765380859375, 1.628448486328125, 1.68035888671875, 1.732269287109375, 1.7841796875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 7.0, 20.0, 31.0, 57.0, 92.0, 167.0, 231.0, 194.0, 82.0, 54.0, 30.0, 20.0, 10.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.951171875, -0.88983154296875, -0.8284912109375, -0.76715087890625, -0.705810546875, -0.64447021484375, -0.5831298828125, -0.52178955078125, -0.46044921875, -0.39910888671875, -0.3377685546875, -0.27642822265625, -0.215087890625, -0.15374755859375, -0.0924072265625, -0.03106689453125, 0.0302734375, 0.09161376953125, 0.1529541015625, 0.21429443359375, 0.275634765625, 0.33697509765625, 0.3983154296875, 0.45965576171875, 0.52099609375, 0.58233642578125, 0.6436767578125, 0.70501708984375, 0.766357421875, 0.82769775390625, 0.8890380859375, 0.95037841796875, 1.01171875, 1.07305908203125, 1.1343994140625, 1.19573974609375, 1.257080078125, 1.31842041015625, 1.3797607421875, 1.44110107421875, 1.50244140625, 1.56378173828125, 1.6251220703125, 1.68646240234375, 1.747802734375, 1.80914306640625, 1.8704833984375, 1.93182373046875, 1.9931640625, 2.05450439453125, 2.1158447265625, 2.17718505859375, 2.238525390625, 2.29986572265625, 2.3612060546875, 2.42254638671875, 2.48388671875, 2.54522705078125, 2.6065673828125, 2.66790771484375, 2.729248046875, 2.79058837890625, 2.8519287109375, 2.91326904296875, 2.974609375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 7.0, 21.0, 51.0, 118.0, 249.0, 301.0, 168.0, 61.0, 18.0, 11.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.860965728759766, -47.90804672241211, -46.95512390136719, -46.00220489501953, -45.04928207397461, -44.09636306762695, -43.14344024658203, -42.190521240234375, -41.23760223388672, -40.28468322753906, -39.33176040649414, -38.378841400146484, -37.42591857910156, -36.472999572753906, -35.520076751708984, -34.56715774536133, -33.614234924316406, -32.66131591796875, -31.708393096923828, -30.75547218322754, -29.80255126953125, -28.849632263183594, -27.896711349487305, -26.943790435791016, -25.990869522094727, -25.037948608398438, -24.08502769470215, -23.13210678100586, -22.179187774658203, -21.22626495361328, -20.273345947265625, -19.320425033569336, -18.367504119873047, -17.414583206176758, -16.46166229248047, -15.508742332458496, -14.555821418762207, -13.602900505065918, -12.649980545043945, -11.697059631347656, -10.744139671325684, -9.791218757629395, -8.838298797607422, -7.885377883911133, -6.932456970214844, -5.979536056518555, -5.026615619659424, -4.073695182800293, -3.120774269104004, -2.167853593826294, -1.214932918548584, -0.262012243270874, 0.6909084320068359, 1.643829345703125, 2.596749782562256, 3.5496702194213867, 4.502591133117676, 5.455512046813965, 6.408432483673096, 7.361352920532227, 8.314273834228516, 9.267194747924805, 10.220115661621094, 11.173035621643066, 12.125956535339355]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0, 10.0, 6.0, 16.0, 13.0, 15.0, 14.0, 21.0, 23.0, 25.0, 29.0, 21.0, 29.0, 28.0, 28.0, 34.0, 23.0, 38.0, 43.0, 40.0, 44.0, 44.0, 45.0, 36.0, 35.0, 40.0, 33.0, 33.0, 25.0, 28.0, 22.0, 20.0, 19.0, 21.0, 19.0, 19.0, 6.0, 14.0, 10.0, 10.0, 3.0, 7.0, 4.0, 8.0, 0.0, 1.0, 3.0], "bins": [-14.676142692565918, -14.284707069396973, -13.893271446228027, -13.501835823059082, -13.11039924621582, -12.718963623046875, -12.32752799987793, -11.936092376708984, -11.544656753540039, -11.153221130371094, -10.761785507202148, -10.370349884033203, -9.978914260864258, -9.587477684020996, -9.19604206085205, -8.804606437683105, -8.41317081451416, -8.021735191345215, -7.6302995681762695, -7.238863468170166, -6.847427845001221, -6.455992221832275, -6.064556121826172, -5.673120498657227, -5.281684875488281, -4.890249252319336, -4.498813629150391, -4.107377529144287, -3.715941905975342, -3.3245062828063965, -2.933070421218872, -2.5416345596313477, -2.150197982788086, -1.758762240409851, -1.3673264980316162, -0.9758907556533813, -0.5844550132751465, -0.19301927089691162, 0.19841647148132324, 0.5898523330688477, 0.981287956237793, 1.3727236986160278, 1.7641594409942627, 2.155595302581787, 2.5470309257507324, 2.9384665489196777, 3.329902410507202, 3.7213382720947266, 4.112773895263672, 4.504209518432617, 4.8956451416015625, 5.287081241607666, 5.678516864776611, 6.069952487945557, 6.46138858795166, 6.8528242111206055, 7.244259834289551, 7.635695457458496, 8.027131080627441, 8.418566703796387, 8.810003280639648, 9.201438903808594, 9.592874526977539, 9.984310150146484, 10.37574577331543]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 6.0, 15.0, 16.0, 22.0, 41.0, 61.0, 120.0, 195.0, 384.0, 942.0, 2406.0, 9153.0, 79609.0, 3972023.0, 112574.0, 11427.0, 2948.0, 1094.0, 524.0, 276.0, 163.0, 84.0, 51.0, 42.0, 24.0, 20.0, 13.0, 14.0, 8.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.900390625, -2.791168212890625, -2.68194580078125, -2.572723388671875, -2.4635009765625, -2.354278564453125, -2.24505615234375, -2.135833740234375, -2.026611328125, -1.917388916015625, -1.80816650390625, -1.698944091796875, -1.5897216796875, -1.480499267578125, -1.37127685546875, -1.262054443359375, -1.15283203125, -1.043609619140625, -0.93438720703125, -0.825164794921875, -0.7159423828125, -0.606719970703125, -0.49749755859375, -0.388275146484375, -0.279052734375, -0.169830322265625, -0.06060791015625, 0.048614501953125, 0.1578369140625, 0.267059326171875, 0.37628173828125, 0.485504150390625, 0.5947265625, 0.703948974609375, 0.81317138671875, 0.922393798828125, 1.0316162109375, 1.140838623046875, 1.25006103515625, 1.359283447265625, 1.468505859375, 1.577728271484375, 1.68695068359375, 1.796173095703125, 1.9053955078125, 2.014617919921875, 2.12384033203125, 2.233062744140625, 2.34228515625, 2.451507568359375, 2.56072998046875, 2.669952392578125, 2.7791748046875, 2.888397216796875, 2.99761962890625, 3.106842041015625, 3.216064453125, 3.325286865234375, 3.43450927734375, 3.543731689453125, 3.6529541015625, 3.762176513671875, 3.87139892578125, 3.980621337890625, 4.08984375]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 7.0, 4.0, 8.0, 9.0, 18.0, 26.0, 33.0, 38.0, 49.0, 55.0, 64.0, 86.0, 72.0, 86.0, 78.0, 77.0, 56.0, 59.0, 51.0, 37.0, 31.0, 21.0, 18.0, 12.0, 12.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74169921875, -0.7072372436523438, -0.6727752685546875, -0.6383132934570312, -0.603851318359375, -0.5693893432617188, -0.5349273681640625, -0.5004653930664062, -0.46600341796875, -0.43154144287109375, -0.3970794677734375, -0.36261749267578125, -0.328155517578125, -0.29369354248046875, -0.2592315673828125, -0.22476959228515625, -0.1903076171875, -0.15584564208984375, -0.1213836669921875, -0.08692169189453125, -0.052459716796875, -0.01799774169921875, 0.0164642333984375, 0.05092620849609375, 0.08538818359375, 0.11985015869140625, 0.1543121337890625, 0.18877410888671875, 0.223236083984375, 0.25769805908203125, 0.2921600341796875, 0.32662200927734375, 0.361083984375, 0.39554595947265625, 0.4300079345703125, 0.46446990966796875, 0.498931884765625, 0.5333938598632812, 0.5678558349609375, 0.6023178100585938, 0.63677978515625, 0.6712417602539062, 0.7057037353515625, 0.7401657104492188, 0.774627685546875, 0.8090896606445312, 0.8435516357421875, 0.8780136108398438, 0.9124755859375, 0.9469375610351562, 0.9813995361328125, 1.0158615112304688, 1.050323486328125, 1.0847854614257812, 1.1192474365234375, 1.1537094116210938, 1.18817138671875, 1.2226333618164062, 1.2570953369140625, 1.2915573120117188, 1.326019287109375, 1.3604812622070312, 1.3949432373046875, 1.4294052124023438, 1.4638671875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 9.0, 8.0, 22.0, 29.0, 32.0, 44.0, 97.0, 140.0, 259.0, 487.0, 785.0, 1789.0, 4890.0, 19434.0, 171808.0, 3785308.0, 180458.0, 19885.0, 4964.0, 1879.0, 850.0, 458.0, 242.0, 144.0, 98.0, 59.0, 45.0, 24.0, 17.0, 8.0, 9.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6904296875, -1.6241607666015625, -1.557891845703125, -1.4916229248046875, -1.42535400390625, -1.3590850830078125, -1.292816162109375, -1.2265472412109375, -1.1602783203125, -1.0940093994140625, -1.027740478515625, -0.9614715576171875, -0.89520263671875, -0.8289337158203125, -0.762664794921875, -0.6963958740234375, -0.630126953125, -0.5638580322265625, -0.497589111328125, -0.4313201904296875, -0.36505126953125, -0.2987823486328125, -0.232513427734375, -0.1662445068359375, -0.0999755859375, -0.0337066650390625, 0.032562255859375, 0.0988311767578125, 0.16510009765625, 0.2313690185546875, 0.297637939453125, 0.3639068603515625, 0.43017578125, 0.4964447021484375, 0.562713623046875, 0.6289825439453125, 0.69525146484375, 0.7615203857421875, 0.827789306640625, 0.8940582275390625, 0.9603271484375, 1.0265960693359375, 1.092864990234375, 1.1591339111328125, 1.22540283203125, 1.2916717529296875, 1.357940673828125, 1.4242095947265625, 1.490478515625, 1.5567474365234375, 1.623016357421875, 1.6892852783203125, 1.75555419921875, 1.8218231201171875, 1.888092041015625, 1.9543609619140625, 2.0206298828125, 2.0868988037109375, 2.153167724609375, 2.2194366455078125, 2.28570556640625, 2.3519744873046875, 2.418243408203125, 2.4845123291015625, 2.55078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 8.0, 17.0, 28.0, 39.0, 106.0, 235.0, 1648.0, 1593.0, 232.0, 75.0, 39.0, 16.0, 14.0, 10.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.498046875, -1.4481048583984375, -1.398162841796875, -1.3482208251953125, -1.29827880859375, -1.2483367919921875, -1.198394775390625, -1.1484527587890625, -1.0985107421875, -1.0485687255859375, -0.998626708984375, -0.9486846923828125, -0.89874267578125, -0.8488006591796875, -0.798858642578125, -0.7489166259765625, -0.698974609375, -0.6490325927734375, -0.599090576171875, -0.5491485595703125, -0.49920654296875, -0.4492645263671875, -0.399322509765625, -0.3493804931640625, -0.2994384765625, -0.2494964599609375, -0.199554443359375, -0.1496124267578125, -0.09967041015625, -0.0497283935546875, 0.000213623046875, 0.0501556396484375, 0.10009765625, 0.1500396728515625, 0.199981689453125, 0.2499237060546875, 0.29986572265625, 0.3498077392578125, 0.399749755859375, 0.4496917724609375, 0.4996337890625, 0.5495758056640625, 0.599517822265625, 0.6494598388671875, 0.69940185546875, 0.7493438720703125, 0.799285888671875, 0.8492279052734375, 0.899169921875, 0.9491119384765625, 0.999053955078125, 1.0489959716796875, 1.09893798828125, 1.1488800048828125, 1.198822021484375, 1.2487640380859375, 1.2987060546875, 1.3486480712890625, 1.398590087890625, 1.4485321044921875, 1.49847412109375, 1.5484161376953125, 1.598358154296875, 1.6483001708984375, 1.6982421875]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 7.0, 6.0, 5.0, 8.0, 18.0, 26.0, 60.0, 111.0, 152.0, 196.0, 178.0, 125.0, 58.0, 28.0, 12.0, 11.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.8100481033325195, -7.638354778289795, -7.46666145324707, -7.294968128204346, -7.123274803161621, -6.951581954956055, -6.779888153076172, -6.6081953048706055, -6.436501979827881, -6.264808654785156, -6.093115329742432, -5.921422004699707, -5.749728679656982, -5.578035354614258, -5.406342506408691, -5.234649181365967, -5.062955856323242, -4.891262531280518, -4.719569206237793, -4.547875881195068, -4.376182556152344, -4.204489707946777, -4.0327959060668945, -3.861103057861328, -3.6894092559814453, -3.5177159309387207, -3.346022605895996, -3.1743292808532715, -3.002636194229126, -2.8309428691864014, -2.6592495441436768, -2.4875564575195312, -2.3158633708953857, -2.144170045852661, -1.972476840019226, -1.8007835149765015, -1.6290903091430664, -1.4573969841003418, -1.2857036590576172, -1.1140104532241821, -0.9423171281814575, -0.7706238627433777, -0.5989305973052979, -0.42723727226257324, -0.2555440068244934, -0.08385074138641357, 0.08784258365631104, 0.2595357894897461, 0.4312291145324707, 0.6029223799705505, 0.7746156454086304, 0.946308970451355, 1.11800217628479, 1.2896955013275146, 1.4613888263702393, 1.6330820322036743, 1.804775357246399, 1.9764686822891235, 2.1481618881225586, 2.319855213165283, 2.491548538208008, 2.6632418632507324, 2.834935188293457, 3.0066282749176025, 3.178321599960327]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 0.0, 7.0, 7.0, 11.0, 18.0, 24.0, 21.0, 29.0, 30.0, 35.0, 51.0, 47.0, 48.0, 43.0, 59.0, 41.0, 52.0, 73.0, 44.0, 46.0, 58.0, 42.0, 33.0, 31.0, 27.0, 20.0, 23.0, 10.0, 16.0, 11.0, 10.0, 5.0, 6.0, 5.0, 4.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.2356553077697754, -3.1369307041168213, -3.038206100463867, -2.939481496810913, -2.840756893157959, -2.742032289505005, -2.643307685852051, -2.5445830821990967, -2.4458584785461426, -2.3471338748931885, -2.2484092712402344, -2.1496846675872803, -2.050960063934326, -1.952235460281372, -1.853510856628418, -1.7547862529754639, -1.6560615301132202, -1.5573369264602661, -1.458612322807312, -1.359887719154358, -1.2611631155014038, -1.1624385118484497, -1.063713788986206, -0.9649892449378967, -0.8662646412849426, -0.7675400376319885, -0.6688154339790344, -0.5700907707214355, -0.47136619687080383, -0.37264159321784973, -0.27391695976257324, -0.17519235610961914, -0.07646775245666504, 0.02225685864686966, 0.12098146975040436, 0.21970608830451965, 0.31843069195747375, 0.41715529561042786, 0.5158799290657043, 0.6146045327186584, 0.7133291363716125, 0.8120537400245667, 0.9107783436775208, 1.0095030069351196, 1.1082276105880737, 1.2069522142410278, 1.305676817893982, 1.404401421546936, 1.5031260251998901, 1.6018506288528442, 1.7005752325057983, 1.7992998361587524, 1.8980244398117065, 1.9967490434646606, 2.0954737663269043, 2.1941983699798584, 2.2929229736328125, 2.3916475772857666, 2.4903721809387207, 2.589096784591675, 2.687821388244629, 2.786545991897583, 2.885270595550537, 2.983995199203491, 3.0827198028564453]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 7.0, 8.0, 16.0, 42.0, 51.0, 97.0, 186.0, 439.0, 1035.0, 3396.0, 15803.0, 130895.0, 690584.0, 179780.0, 20052.0, 4031.0, 1168.0, 470.0, 221.0, 96.0, 70.0, 39.0, 21.0, 15.0, 8.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.568359375, -3.447662353515625, -3.32696533203125, -3.206268310546875, -3.0855712890625, -2.964874267578125, -2.84417724609375, -2.723480224609375, -2.602783203125, -2.482086181640625, -2.36138916015625, -2.240692138671875, -2.1199951171875, -1.999298095703125, -1.87860107421875, -1.757904052734375, -1.63720703125, -1.516510009765625, -1.39581298828125, -1.275115966796875, -1.1544189453125, -1.033721923828125, -0.91302490234375, -0.792327880859375, -0.671630859375, -0.550933837890625, -0.43023681640625, -0.309539794921875, -0.1888427734375, -0.068145751953125, 0.05255126953125, 0.173248291015625, 0.2939453125, 0.414642333984375, 0.53533935546875, 0.656036376953125, 0.7767333984375, 0.897430419921875, 1.01812744140625, 1.138824462890625, 1.259521484375, 1.380218505859375, 1.50091552734375, 1.621612548828125, 1.7423095703125, 1.863006591796875, 1.98370361328125, 2.104400634765625, 2.22509765625, 2.345794677734375, 2.46649169921875, 2.587188720703125, 2.7078857421875, 2.828582763671875, 2.94927978515625, 3.069976806640625, 3.190673828125, 3.311370849609375, 3.43206787109375, 3.552764892578125, 3.6734619140625, 3.794158935546875, 3.91485595703125, 4.035552978515625, 4.15625]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 8.0, 9.0, 11.0, 17.0, 24.0, 41.0, 48.0, 53.0, 47.0, 71.0, 94.0, 76.0, 84.0, 92.0, 69.0, 65.0, 49.0, 41.0, 30.0, 30.0, 21.0, 13.0, 5.0, 8.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76171875, -0.725555419921875, -0.68939208984375, -0.653228759765625, -0.6170654296875, -0.580902099609375, -0.54473876953125, -0.508575439453125, -0.472412109375, -0.436248779296875, -0.40008544921875, -0.363922119140625, -0.3277587890625, -0.291595458984375, -0.25543212890625, -0.219268798828125, -0.18310546875, -0.146942138671875, -0.11077880859375, -0.074615478515625, -0.0384521484375, -0.002288818359375, 0.03387451171875, 0.070037841796875, 0.106201171875, 0.142364501953125, 0.17852783203125, 0.214691162109375, 0.2508544921875, 0.287017822265625, 0.32318115234375, 0.359344482421875, 0.3955078125, 0.431671142578125, 0.46783447265625, 0.503997802734375, 0.5401611328125, 0.576324462890625, 0.61248779296875, 0.648651123046875, 0.684814453125, 0.720977783203125, 0.75714111328125, 0.793304443359375, 0.8294677734375, 0.865631103515625, 0.90179443359375, 0.937957763671875, 0.97412109375, 1.010284423828125, 1.04644775390625, 1.082611083984375, 1.1187744140625, 1.154937744140625, 1.19110107421875, 1.227264404296875, 1.263427734375, 1.299591064453125, 1.33575439453125, 1.371917724609375, 1.4080810546875, 1.444244384765625, 1.48040771484375, 1.516571044921875, 1.552734375]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 6.0, 7.0, 11.0, 20.0, 55.0, 94.0, 169.0, 391.0, 975.0, 3080.0, 17363.0, 233256.0, 722368.0, 60990.0, 6957.0, 1664.0, 637.0, 267.0, 105.0, 68.0, 30.0, 14.0, 12.0, 6.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.125, -3.98870849609375, -3.8524169921875, -3.71612548828125, -3.579833984375, -3.44354248046875, -3.3072509765625, -3.17095947265625, -3.03466796875, -2.89837646484375, -2.7620849609375, -2.62579345703125, -2.489501953125, -2.35321044921875, -2.2169189453125, -2.08062744140625, -1.9443359375, -1.80804443359375, -1.6717529296875, -1.53546142578125, -1.399169921875, -1.26287841796875, -1.1265869140625, -0.99029541015625, -0.85400390625, -0.71771240234375, -0.5814208984375, -0.44512939453125, -0.308837890625, -0.17254638671875, -0.0362548828125, 0.10003662109375, 0.236328125, 0.37261962890625, 0.5089111328125, 0.64520263671875, 0.781494140625, 0.91778564453125, 1.0540771484375, 1.19036865234375, 1.32666015625, 1.46295166015625, 1.5992431640625, 1.73553466796875, 1.871826171875, 2.00811767578125, 2.1444091796875, 2.28070068359375, 2.4169921875, 2.55328369140625, 2.6895751953125, 2.82586669921875, 2.962158203125, 3.09844970703125, 3.2347412109375, 3.37103271484375, 3.50732421875, 3.64361572265625, 3.7799072265625, 3.91619873046875, 4.052490234375, 4.18878173828125, 4.3250732421875, 4.46136474609375, 4.59765625]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 3.0, 5.0, 8.0, 7.0, 6.0, 7.0, 13.0, 13.0, 18.0, 21.0, 25.0, 23.0, 41.0, 38.0, 29.0, 41.0, 60.0, 37.0, 44.0, 54.0, 58.0, 59.0, 50.0, 60.0, 43.0, 45.0, 33.0, 35.0, 28.0, 25.0, 12.0, 14.0, 13.0, 12.0, 6.0, 10.0, 6.0, 3.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.0625, -3.94049072265625, -3.8184814453125, -3.69647216796875, -3.574462890625, -3.45245361328125, -3.3304443359375, -3.20843505859375, -3.08642578125, -2.96441650390625, -2.8424072265625, -2.72039794921875, -2.598388671875, -2.47637939453125, -2.3543701171875, -2.23236083984375, -2.1103515625, -1.98834228515625, -1.8663330078125, -1.74432373046875, -1.622314453125, -1.50030517578125, -1.3782958984375, -1.25628662109375, -1.13427734375, -1.01226806640625, -0.8902587890625, -0.76824951171875, -0.646240234375, -0.52423095703125, -0.4022216796875, -0.28021240234375, -0.158203125, -0.03619384765625, 0.0858154296875, 0.20782470703125, 0.329833984375, 0.45184326171875, 0.5738525390625, 0.69586181640625, 0.81787109375, 0.93988037109375, 1.0618896484375, 1.18389892578125, 1.305908203125, 1.42791748046875, 1.5499267578125, 1.67193603515625, 1.7939453125, 1.91595458984375, 2.0379638671875, 2.15997314453125, 2.281982421875, 2.40399169921875, 2.5260009765625, 2.64801025390625, 2.77001953125, 2.89202880859375, 3.0140380859375, 3.13604736328125, 3.258056640625, 3.38006591796875, 3.5020751953125, 3.62408447265625, 3.74609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 14.0, 16.0, 45.0, 54.0, 115.0, 228.0, 606.0, 2111.0, 17220.0, 660517.0, 354846.0, 10269.0, 1588.0, 491.0, 224.0, 83.0, 46.0, 27.0, 19.0, 12.0, 6.0, 7.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.888671875, -1.82098388671875, -1.7532958984375, -1.68560791015625, -1.617919921875, -1.55023193359375, -1.4825439453125, -1.41485595703125, -1.34716796875, -1.27947998046875, -1.2117919921875, -1.14410400390625, -1.076416015625, -1.00872802734375, -0.9410400390625, -0.87335205078125, -0.8056640625, -0.73797607421875, -0.6702880859375, -0.60260009765625, -0.534912109375, -0.46722412109375, -0.3995361328125, -0.33184814453125, -0.26416015625, -0.19647216796875, -0.1287841796875, -0.06109619140625, 0.006591796875, 0.07427978515625, 0.1419677734375, 0.20965576171875, 0.27734375, 0.34503173828125, 0.4127197265625, 0.48040771484375, 0.548095703125, 0.61578369140625, 0.6834716796875, 0.75115966796875, 0.81884765625, 0.88653564453125, 0.9542236328125, 1.02191162109375, 1.089599609375, 1.15728759765625, 1.2249755859375, 1.29266357421875, 1.3603515625, 1.42803955078125, 1.4957275390625, 1.56341552734375, 1.631103515625, 1.69879150390625, 1.7664794921875, 1.83416748046875, 1.90185546875, 1.96954345703125, 2.0372314453125, 2.10491943359375, 2.172607421875, 2.24029541015625, 2.3079833984375, 2.37567138671875, 2.443359375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 7.0, 6.0, 3.0, 10.0, 34.0, 76.0, 193.0, 305.0, 212.0, 96.0, 39.0, 10.0, 11.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00055694580078125, -0.0005398094654083252, -0.0005226731300354004, -0.0005055367946624756, -0.0004884004592895508, -0.000471264123916626, -0.00045412778854370117, -0.00043699145317077637, -0.00041985511779785156, -0.00040271878242492676, -0.00038558244705200195, -0.00036844611167907715, -0.00035130977630615234, -0.00033417344093322754, -0.00031703710556030273, -0.00029990077018737793, -0.0002827644348144531, -0.0002656280994415283, -0.0002484917640686035, -0.0002313554286956787, -0.0002142190933227539, -0.0001970827579498291, -0.0001799464225769043, -0.0001628100872039795, -0.0001456737518310547, -0.00012853741645812988, -0.00011140108108520508, -9.426474571228027e-05, -7.712841033935547e-05, -5.9992074966430664e-05, -4.285573959350586e-05, -2.5719404220581055e-05, -8.58306884765625e-06, 8.553266525268555e-06, 2.568960189819336e-05, 4.2825937271118164e-05, 5.996227264404297e-05, 7.709860801696777e-05, 9.423494338989258e-05, 0.00011137127876281738, 0.0001285076141357422, 0.000145643949508667, 0.0001627802848815918, 0.0001799166202545166, 0.0001970529556274414, 0.0002141892910003662, 0.00023132562637329102, 0.0002484619617462158, 0.0002655982971191406, 0.00028273463249206543, 0.00029987096786499023, 0.00031700730323791504, 0.00033414363861083984, 0.00035127997398376465, 0.00036841630935668945, 0.00038555264472961426, 0.00040268898010253906, 0.00041982531547546387, 0.00043696165084838867, 0.0004540979862213135, 0.0004712343215942383, 0.0004883706569671631, 0.0005055069923400879, 0.0005226433277130127, 0.0005397796630859375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 7.0, 17.0, 20.0, 44.0, 85.0, 134.0, 328.0, 834.0, 3079.0, 20326.0, 399521.0, 587387.0, 31219.0, 3813.0, 1027.0, 352.0, 186.0, 68.0, 46.0, 29.0, 15.0, 10.0, 5.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4697265625, -1.417388916015625, -1.36505126953125, -1.312713623046875, -1.2603759765625, -1.208038330078125, -1.15570068359375, -1.103363037109375, -1.051025390625, -0.998687744140625, -0.94635009765625, -0.894012451171875, -0.8416748046875, -0.789337158203125, -0.73699951171875, -0.684661865234375, -0.63232421875, -0.579986572265625, -0.52764892578125, -0.475311279296875, -0.4229736328125, -0.370635986328125, -0.31829833984375, -0.265960693359375, -0.213623046875, -0.161285400390625, -0.10894775390625, -0.056610107421875, -0.0042724609375, 0.048065185546875, 0.10040283203125, 0.152740478515625, 0.205078125, 0.257415771484375, 0.30975341796875, 0.362091064453125, 0.4144287109375, 0.466766357421875, 0.51910400390625, 0.571441650390625, 0.623779296875, 0.676116943359375, 0.72845458984375, 0.780792236328125, 0.8331298828125, 0.885467529296875, 0.93780517578125, 0.990142822265625, 1.04248046875, 1.094818115234375, 1.14715576171875, 1.199493408203125, 1.2518310546875, 1.304168701171875, 1.35650634765625, 1.408843994140625, 1.461181640625, 1.513519287109375, 1.56585693359375, 1.618194580078125, 1.6705322265625, 1.722869873046875, 1.77520751953125, 1.827545166015625, 1.8798828125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 11.0, 25.0, 32.0, 76.0, 142.0, 239.0, 197.0, 128.0, 67.0, 32.0, 20.0, 12.0, 6.0, 7.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.015625, -2.931732177734375, -2.84783935546875, -2.763946533203125, -2.6800537109375, -2.596160888671875, -2.51226806640625, -2.428375244140625, -2.344482421875, -2.260589599609375, -2.17669677734375, -2.092803955078125, -2.0089111328125, -1.925018310546875, -1.84112548828125, -1.757232666015625, -1.67333984375, -1.589447021484375, -1.50555419921875, -1.421661376953125, -1.3377685546875, -1.253875732421875, -1.16998291015625, -1.086090087890625, -1.002197265625, -0.918304443359375, -0.83441162109375, -0.750518798828125, -0.6666259765625, -0.582733154296875, -0.49884033203125, -0.414947509765625, -0.3310546875, -0.247161865234375, -0.16326904296875, -0.079376220703125, 0.0045166015625, 0.088409423828125, 0.17230224609375, 0.256195068359375, 0.340087890625, 0.423980712890625, 0.50787353515625, 0.591766357421875, 0.6756591796875, 0.759552001953125, 0.84344482421875, 0.927337646484375, 1.01123046875, 1.095123291015625, 1.17901611328125, 1.262908935546875, 1.3468017578125, 1.430694580078125, 1.51458740234375, 1.598480224609375, 1.682373046875, 1.766265869140625, 1.85015869140625, 1.934051513671875, 2.0179443359375, 2.101837158203125, 2.18572998046875, 2.269622802734375, 2.353515625]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 7.0, 4.0, 16.0, 23.0, 48.0, 85.0, 148.0, 182.0, 163.0, 138.0, 86.0, 58.0, 22.0, 10.0, 8.0, 7.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.656537055969238, -11.912866592407227, -11.169195175170898, -10.425524711608887, -9.681854248046875, -8.938183784484863, -8.194513320922852, -7.450841903686523, -6.707171440124512, -5.9635009765625, -5.21983003616333, -4.47615909576416, -3.7324886322021484, -2.9888179302215576, -2.245147228240967, -1.5014762878417969, -0.7578058242797852, -0.014135122299194336, 0.7295355796813965, 1.4732062816619873, 2.216876983642578, 2.960547685623169, 3.7042183876037598, 4.44788932800293, 5.191559791564941, 5.935230255126953, 6.678901195526123, 7.422572135925293, 8.166242599487305, 8.909913063049316, 9.653583526611328, 10.397254943847656, 11.140926361083984, 11.884596824645996, 12.628267288208008, 13.371938705444336, 14.115609169006348, 14.85927963256836, 15.602951049804688, 16.346622467041016, 17.09029197692871, 17.83396339416504, 18.577632904052734, 19.321304321289062, 20.06497573852539, 20.808645248413086, 21.552316665649414, 22.29598617553711, 23.039657592773438, 23.783329010009766, 24.52699851989746, 25.27066993713379, 26.014339447021484, 26.758010864257812, 27.50168228149414, 28.24535369873047, 28.989023208618164, 29.732694625854492, 30.476364135742188, 31.220035552978516, 31.963706970214844, 32.70737838745117, 33.451045989990234, 34.19471740722656, 34.93838882446289]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 7.0, 4.0, 7.0, 10.0, 12.0, 13.0, 6.0, 20.0, 14.0, 16.0, 19.0, 34.0, 34.0, 38.0, 49.0, 51.0, 56.0, 61.0, 47.0, 51.0, 56.0, 56.0, 42.0, 35.0, 40.0, 38.0, 37.0, 24.0, 21.0, 13.0, 15.0, 14.0, 11.0, 22.0, 7.0, 8.0, 0.0, 2.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-21.841676712036133, -21.199190139770508, -20.55670166015625, -19.914215087890625, -19.271726608276367, -18.629240036010742, -17.986751556396484, -17.34426498413086, -16.701778411865234, -16.05929183959961, -15.416803359985352, -14.77431583404541, -14.131828308105469, -13.489341735839844, -12.846854209899902, -12.204366683959961, -11.561878204345703, -10.919390678405762, -10.27690315246582, -9.634415626525879, -8.991928100585938, -8.349441528320312, -7.706954002380371, -7.06446647644043, -6.421978950500488, -5.779491424560547, -5.1370038986206055, -4.494516849517822, -3.852029323577881, -3.2095417976379395, -2.567054510116577, -1.9245672225952148, -1.2820816040039062, -0.6395941972732544, 0.002893209457397461, 0.6453806161880493, 1.2878680229187012, 1.9303555488586426, 2.572842836380005, 3.215330123901367, 3.8578176498413086, 4.50030517578125, 5.142792701721191, 5.785279750823975, 6.427767276763916, 7.070254802703857, 7.712741851806641, 8.355229377746582, 8.997716903686523, 9.640204429626465, 10.282691955566406, 10.925179481506348, 11.567667007446289, 12.210153579711914, 12.852641105651855, 13.495128631591797, 14.137616157531738, 14.78010368347168, 15.422591209411621, 16.065078735351562, 16.707565307617188, 17.350053787231445, 17.99254035949707, 18.635028839111328, 19.277515411376953]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 6.0, 6.0, 25.0, 23.0, 46.0, 75.0, 125.0, 218.0, 402.0, 735.0, 1699.0, 4925.0, 26255.0, 3654879.0, 477934.0, 19553.0, 4323.0, 1539.0, 673.0, 340.0, 196.0, 111.0, 60.0, 45.0, 28.0, 18.0, 14.0, 8.0, 5.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.474609375, -2.391937255859375, -2.30926513671875, -2.226593017578125, -2.1439208984375, -2.061248779296875, -1.97857666015625, -1.895904541015625, -1.813232421875, -1.730560302734375, -1.64788818359375, -1.565216064453125, -1.4825439453125, -1.399871826171875, -1.31719970703125, -1.234527587890625, -1.15185546875, -1.069183349609375, -0.98651123046875, -0.903839111328125, -0.8211669921875, -0.738494873046875, -0.65582275390625, -0.573150634765625, -0.490478515625, -0.407806396484375, -0.32513427734375, -0.242462158203125, -0.1597900390625, -0.077117919921875, 0.00555419921875, 0.088226318359375, 0.1708984375, 0.253570556640625, 0.33624267578125, 0.418914794921875, 0.5015869140625, 0.584259033203125, 0.66693115234375, 0.749603271484375, 0.832275390625, 0.914947509765625, 0.99761962890625, 1.080291748046875, 1.1629638671875, 1.245635986328125, 1.32830810546875, 1.410980224609375, 1.49365234375, 1.576324462890625, 1.65899658203125, 1.741668701171875, 1.8243408203125, 1.907012939453125, 1.98968505859375, 2.072357177734375, 2.155029296875, 2.237701416015625, 2.32037353515625, 2.403045654296875, 2.4857177734375, 2.568389892578125, 2.65106201171875, 2.733734130859375, 2.81640625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 4.0, 6.0, 9.0, 9.0, 11.0, 16.0, 14.0, 22.0, 35.0, 37.0, 47.0, 45.0, 56.0, 66.0, 69.0, 61.0, 72.0, 51.0, 60.0, 68.0, 65.0, 61.0, 31.0, 20.0, 17.0, 21.0, 14.0, 6.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81494140625, -0.7792434692382812, -0.7435455322265625, -0.7078475952148438, -0.672149658203125, -0.6364517211914062, -0.6007537841796875, -0.5650558471679688, -0.52935791015625, -0.49365997314453125, -0.4579620361328125, -0.42226409912109375, -0.386566162109375, -0.35086822509765625, -0.3151702880859375, -0.27947235107421875, -0.2437744140625, -0.20807647705078125, -0.1723785400390625, -0.13668060302734375, -0.100982666015625, -0.06528472900390625, -0.0295867919921875, 0.00611114501953125, 0.04180908203125, 0.07750701904296875, 0.1132049560546875, 0.14890289306640625, 0.184600830078125, 0.22029876708984375, 0.2559967041015625, 0.29169464111328125, 0.327392578125, 0.36309051513671875, 0.3987884521484375, 0.43448638916015625, 0.470184326171875, 0.5058822631835938, 0.5415802001953125, 0.5772781372070312, 0.61297607421875, 0.6486740112304688, 0.6843719482421875, 0.7200698852539062, 0.755767822265625, 0.7914657592773438, 0.8271636962890625, 0.8628616333007812, 0.8985595703125, 0.9342575073242188, 0.9699554443359375, 1.0056533813476562, 1.041351318359375, 1.0770492553710938, 1.1127471923828125, 1.1484451293945312, 1.18414306640625, 1.2198410034179688, 1.2555389404296875, 1.2912368774414062, 1.326934814453125, 1.3626327514648438, 1.3983306884765625, 1.4340286254882812, 1.4697265625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 6.0, 12.0, 15.0, 11.0, 9.0, 16.0, 27.0, 38.0, 28.0, 52.0, 60.0, 82.0, 112.0, 134.0, 203.0, 283.0, 383.0, 593.0, 985.0, 1901.0, 3765.0, 9322.0, 30071.0, 202542.0, 3762761.0, 139438.0, 25104.0, 8136.0, 3531.0, 1701.0, 915.0, 572.0, 362.0, 275.0, 199.0, 161.0, 95.0, 74.0, 62.0, 46.0, 42.0, 35.0, 20.0, 25.0, 19.0, 20.0, 9.0, 6.0, 8.0, 7.0, 7.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.216796875, -1.1768035888671875, -1.136810302734375, -1.0968170166015625, -1.05682373046875, -1.0168304443359375, -0.976837158203125, -0.9368438720703125, -0.8968505859375, -0.8568572998046875, -0.816864013671875, -0.7768707275390625, -0.73687744140625, -0.6968841552734375, -0.656890869140625, -0.6168975830078125, -0.576904296875, -0.5369110107421875, -0.496917724609375, -0.4569244384765625, -0.41693115234375, -0.3769378662109375, -0.336944580078125, -0.2969512939453125, -0.2569580078125, -0.2169647216796875, -0.176971435546875, -0.1369781494140625, -0.09698486328125, -0.0569915771484375, -0.016998291015625, 0.0229949951171875, 0.06298828125, 0.1029815673828125, 0.142974853515625, 0.1829681396484375, 0.22296142578125, 0.2629547119140625, 0.302947998046875, 0.3429412841796875, 0.3829345703125, 0.4229278564453125, 0.462921142578125, 0.5029144287109375, 0.54290771484375, 0.5829010009765625, 0.622894287109375, 0.6628875732421875, 0.702880859375, 0.7428741455078125, 0.782867431640625, 0.8228607177734375, 0.86285400390625, 0.9028472900390625, 0.942840576171875, 0.9828338623046875, 1.0228271484375, 1.0628204345703125, 1.102813720703125, 1.1428070068359375, 1.18280029296875, 1.2227935791015625, 1.262786865234375, 1.3027801513671875, 1.3427734375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 6.0, 19.0, 40.0, 115.0, 587.0, 2989.0, 172.0, 70.0, 31.0, 11.0, 10.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.517578125, -0.499847412109375, -0.48211669921875, -0.464385986328125, -0.4466552734375, -0.428924560546875, -0.41119384765625, -0.393463134765625, -0.375732421875, -0.358001708984375, -0.34027099609375, -0.322540283203125, -0.3048095703125, -0.287078857421875, -0.26934814453125, -0.251617431640625, -0.23388671875, -0.216156005859375, -0.19842529296875, -0.180694580078125, -0.1629638671875, -0.145233154296875, -0.12750244140625, -0.109771728515625, -0.092041015625, -0.074310302734375, -0.05657958984375, -0.038848876953125, -0.0211181640625, -0.003387451171875, 0.01434326171875, 0.032073974609375, 0.0498046875, 0.067535400390625, 0.08526611328125, 0.102996826171875, 0.1207275390625, 0.138458251953125, 0.15618896484375, 0.173919677734375, 0.191650390625, 0.209381103515625, 0.22711181640625, 0.244842529296875, 0.2625732421875, 0.280303955078125, 0.29803466796875, 0.315765380859375, 0.33349609375, 0.351226806640625, 0.36895751953125, 0.386688232421875, 0.4044189453125, 0.422149658203125, 0.43988037109375, 0.457611083984375, 0.475341796875, 0.493072509765625, 0.51080322265625, 0.528533935546875, 0.5462646484375, 0.563995361328125, 0.58172607421875, 0.599456787109375, 0.6171875]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 26.0, 49.0, 147.0, 221.0, 267.0, 159.0, 82.0, 27.0, 14.0, 7.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.1609153747558594, -1.076160192489624, -0.9914048910140991, -0.9066497087478638, -0.8218944668769836, -0.7371392250061035, -0.6523840427398682, -0.567628800868988, -0.4828735589981079, -0.3981183171272278, -0.31336310505867004, -0.2286078929901123, -0.14385265111923218, -0.05909740924835205, 0.0256577730178833, 0.11041301488876343, 0.19516825675964355, 0.2799234986305237, 0.3646787106990814, 0.44943392276763916, 0.5341891646385193, 0.6189444065093994, 0.7036995887756348, 0.7884548306465149, 0.873210072517395, 0.9579653143882751, 1.0427205562591553, 1.1274757385253906, 1.212230920791626, 1.2969862222671509, 1.3817414045333862, 1.4664967060089111, 1.5512518882751465, 1.6360070705413818, 1.7207623720169067, 1.805517554283142, 1.890272855758667, 1.9750280380249023, 2.0597832202911377, 2.144538402557373, 2.2292938232421875, 2.314049005508423, 2.398804187774658, 2.4835596084594727, 2.568314790725708, 2.6530699729919434, 2.7378251552581787, 2.822580337524414, 2.9073355197906494, 2.9920907020568848, 3.07684588432312, 3.1616010665893555, 3.24635648727417, 3.3311116695404053, 3.4158668518066406, 3.500622034072876, 3.5853772163391113, 3.6701323986053467, 3.754887580871582, 3.8396430015563965, 3.924398183822632, 4.009153366088867, 4.093908309936523, 4.178663730621338, 4.263419151306152]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 4.0, 4.0, 7.0, 12.0, 11.0, 13.0, 16.0, 19.0, 16.0, 22.0, 19.0, 21.0, 38.0, 36.0, 46.0, 62.0, 34.0, 50.0, 48.0, 46.0, 50.0, 38.0, 43.0, 50.0, 35.0, 40.0, 30.0, 31.0, 33.0, 33.0, 18.0, 9.0, 16.0, 7.0, 6.0, 8.0, 5.0, 8.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.1132023334503174, -1.0839381217956543, -1.0546740293502808, -1.0254098176956177, -0.9961456060409546, -0.9668814539909363, -0.937617301940918, -0.9083530902862549, -0.8790888786315918, -0.8498247265815735, -0.8205605149269104, -0.7912963628768921, -0.762032151222229, -0.7327679991722107, -0.7035038471221924, -0.6742396354675293, -0.644975483417511, -0.6157113313674927, -0.5864471197128296, -0.5571829676628113, -0.5279187560081482, -0.4986546039581299, -0.4693904221057892, -0.4401262402534485, -0.4108620584011078, -0.3815978765487671, -0.3523336946964264, -0.3230695128440857, -0.2938053607940674, -0.2645411491394043, -0.235276997089386, -0.2060128152370453, -0.17674869298934937, -0.14748451113700867, -0.11822033673524857, -0.08895616233348846, -0.059691980481147766, -0.030427798628807068, -0.0011636316776275635, 0.028100550174713135, 0.05736473202705383, 0.08662891387939453, 0.11589308828115463, 0.14515726268291473, 0.17442144453525543, 0.20368562638759613, 0.23294979333877563, 0.26221397519111633, 0.29147815704345703, 0.32074233889579773, 0.3500065207481384, 0.37927067279815674, 0.4085348844528198, 0.43779903650283813, 0.46706321835517883, 0.49632740020751953, 0.5255916118621826, 0.5548557639122009, 0.584119975566864, 0.6133841276168823, 0.6426483392715454, 0.6719124913215637, 0.701176643371582, 0.7304408550262451, 0.7597050070762634]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 3.0, 0.0, 4.0, 6.0, 14.0, 16.0, 26.0, 32.0, 45.0, 66.0, 137.0, 267.0, 574.0, 1434.0, 4306.0, 16298.0, 83633.0, 462245.0, 394236.0, 65918.0, 13313.0, 3533.0, 1311.0, 512.0, 260.0, 147.0, 82.0, 52.0, 39.0, 18.0, 15.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3125, -2.21588134765625, -2.1192626953125, -2.02264404296875, -1.926025390625, -1.82940673828125, -1.7327880859375, -1.63616943359375, -1.53955078125, -1.44293212890625, -1.3463134765625, -1.24969482421875, -1.153076171875, -1.05645751953125, -0.9598388671875, -0.86322021484375, -0.7666015625, -0.66998291015625, -0.5733642578125, -0.47674560546875, -0.380126953125, -0.28350830078125, -0.1868896484375, -0.09027099609375, 0.00634765625, 0.10296630859375, 0.1995849609375, 0.29620361328125, 0.392822265625, 0.48944091796875, 0.5860595703125, 0.68267822265625, 0.779296875, 0.87591552734375, 0.9725341796875, 1.06915283203125, 1.165771484375, 1.26239013671875, 1.3590087890625, 1.45562744140625, 1.55224609375, 1.64886474609375, 1.7454833984375, 1.84210205078125, 1.938720703125, 2.03533935546875, 2.1319580078125, 2.22857666015625, 2.3251953125, 2.42181396484375, 2.5184326171875, 2.61505126953125, 2.711669921875, 2.80828857421875, 2.9049072265625, 3.00152587890625, 3.09814453125, 3.19476318359375, 3.2913818359375, 3.38800048828125, 3.484619140625, 3.58123779296875, 3.6778564453125, 3.77447509765625, 3.87109375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 9.0, 14.0, 14.0, 16.0, 25.0, 24.0, 46.0, 47.0, 50.0, 54.0, 67.0, 64.0, 81.0, 55.0, 72.0, 59.0, 76.0, 52.0, 44.0, 37.0, 19.0, 20.0, 20.0, 15.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74560546875, -0.7096328735351562, -0.6736602783203125, -0.6376876831054688, -0.601715087890625, -0.5657424926757812, -0.5297698974609375, -0.49379730224609375, -0.45782470703125, -0.42185211181640625, -0.3858795166015625, -0.34990692138671875, -0.313934326171875, -0.27796173095703125, -0.2419891357421875, -0.20601654052734375, -0.1700439453125, -0.13407135009765625, -0.0980987548828125, -0.06212615966796875, -0.026153564453125, 0.00981903076171875, 0.0457916259765625, 0.08176422119140625, 0.11773681640625, 0.15370941162109375, 0.1896820068359375, 0.22565460205078125, 0.261627197265625, 0.29759979248046875, 0.3335723876953125, 0.36954498291015625, 0.405517578125, 0.44149017333984375, 0.4774627685546875, 0.5134353637695312, 0.549407958984375, 0.5853805541992188, 0.6213531494140625, 0.6573257446289062, 0.69329833984375, 0.7292709350585938, 0.7652435302734375, 0.8012161254882812, 0.837188720703125, 0.8731613159179688, 0.9091339111328125, 0.9451065063476562, 0.9810791015625, 1.0170516967773438, 1.0530242919921875, 1.0889968872070312, 1.124969482421875, 1.1609420776367188, 1.1969146728515625, 1.2328872680664062, 1.26885986328125, 1.3048324584960938, 1.3408050537109375, 1.3767776489257812, 1.412750244140625, 1.4487228393554688, 1.4846954345703125, 1.5206680297851562, 1.556640625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 4.0, 6.0, 4.0, 5.0, 9.0, 12.0, 16.0, 23.0, 44.0, 62.0, 109.0, 208.0, 410.0, 918.0, 2399.0, 7624.0, 35363.0, 364373.0, 568695.0, 53028.0, 10105.0, 2970.0, 1119.0, 475.0, 213.0, 127.0, 71.0, 32.0, 32.0, 17.0, 18.0, 15.0, 6.0, 13.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.283203125, -3.177642822265625, -3.07208251953125, -2.966522216796875, -2.8609619140625, -2.755401611328125, -2.64984130859375, -2.544281005859375, -2.438720703125, -2.333160400390625, -2.22760009765625, -2.122039794921875, -2.0164794921875, -1.910919189453125, -1.80535888671875, -1.699798583984375, -1.59423828125, -1.488677978515625, -1.38311767578125, -1.277557373046875, -1.1719970703125, -1.066436767578125, -0.96087646484375, -0.855316162109375, -0.749755859375, -0.644195556640625, -0.53863525390625, -0.433074951171875, -0.3275146484375, -0.221954345703125, -0.11639404296875, -0.010833740234375, 0.0947265625, 0.200286865234375, 0.30584716796875, 0.411407470703125, 0.5169677734375, 0.622528076171875, 0.72808837890625, 0.833648681640625, 0.939208984375, 1.044769287109375, 1.15032958984375, 1.255889892578125, 1.3614501953125, 1.467010498046875, 1.57257080078125, 1.678131103515625, 1.78369140625, 1.889251708984375, 1.99481201171875, 2.100372314453125, 2.2059326171875, 2.311492919921875, 2.41705322265625, 2.522613525390625, 2.628173828125, 2.733734130859375, 2.83929443359375, 2.944854736328125, 3.0504150390625, 3.155975341796875, 3.26153564453125, 3.367095947265625, 3.47265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 5.0, 3.0, 6.0, 1.0, 9.0, 4.0, 6.0, 3.0, 11.0, 21.0, 13.0, 16.0, 25.0, 16.0, 33.0, 34.0, 47.0, 41.0, 45.0, 45.0, 66.0, 47.0, 48.0, 48.0, 49.0, 46.0, 44.0, 29.0, 37.0, 38.0, 29.0, 24.0, 22.0, 12.0, 9.0, 12.0, 18.0, 5.0, 7.0, 8.0, 3.0, 3.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.796875, -3.6689453125, -3.541015625, -3.4130859375, -3.28515625, -3.1572265625, -3.029296875, -2.9013671875, -2.7734375, -2.6455078125, -2.517578125, -2.3896484375, -2.26171875, -2.1337890625, -2.005859375, -1.8779296875, -1.75, -1.6220703125, -1.494140625, -1.3662109375, -1.23828125, -1.1103515625, -0.982421875, -0.8544921875, -0.7265625, -0.5986328125, -0.470703125, -0.3427734375, -0.21484375, -0.0869140625, 0.041015625, 0.1689453125, 0.296875, 0.4248046875, 0.552734375, 0.6806640625, 0.80859375, 0.9365234375, 1.064453125, 1.1923828125, 1.3203125, 1.4482421875, 1.576171875, 1.7041015625, 1.83203125, 1.9599609375, 2.087890625, 2.2158203125, 2.34375, 2.4716796875, 2.599609375, 2.7275390625, 2.85546875, 2.9833984375, 3.111328125, 3.2392578125, 3.3671875, 3.4951171875, 3.623046875, 3.7509765625, 3.87890625, 4.0068359375, 4.134765625, 4.2626953125, 4.390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 4.0, 6.0, 17.0, 14.0, 23.0, 37.0, 63.0, 94.0, 180.0, 449.0, 1374.0, 9583.0, 608953.0, 417898.0, 7853.0, 1189.0, 384.0, 186.0, 90.0, 61.0, 28.0, 22.0, 14.0, 8.0, 8.0, 7.0, 7.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.625, -2.547698974609375, -2.47039794921875, -2.393096923828125, -2.3157958984375, -2.238494873046875, -2.16119384765625, -2.083892822265625, -2.006591796875, -1.929290771484375, -1.85198974609375, -1.774688720703125, -1.6973876953125, -1.620086669921875, -1.54278564453125, -1.465484619140625, -1.38818359375, -1.310882568359375, -1.23358154296875, -1.156280517578125, -1.0789794921875, -1.001678466796875, -0.92437744140625, -0.847076416015625, -0.769775390625, -0.692474365234375, -0.61517333984375, -0.537872314453125, -0.4605712890625, -0.383270263671875, -0.30596923828125, -0.228668212890625, -0.1513671875, -0.074066162109375, 0.00323486328125, 0.080535888671875, 0.1578369140625, 0.235137939453125, 0.31243896484375, 0.389739990234375, 0.467041015625, 0.544342041015625, 0.62164306640625, 0.698944091796875, 0.7762451171875, 0.853546142578125, 0.93084716796875, 1.008148193359375, 1.08544921875, 1.162750244140625, 1.24005126953125, 1.317352294921875, 1.3946533203125, 1.471954345703125, 1.54925537109375, 1.626556396484375, 1.703857421875, 1.781158447265625, 1.85845947265625, 1.935760498046875, 2.0130615234375, 2.090362548828125, 2.16766357421875, 2.244964599609375, 2.322265625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 7.0, 7.0, 26.0, 54.0, 81.0, 136.0, 196.0, 182.0, 143.0, 82.0, 45.0, 27.0, 10.0, 9.0, 4.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003333091735839844, -0.00032351166009902954, -0.0003137141466140747, -0.0003039166331291199, -0.00029411911964416504, -0.0002843216061592102, -0.00027452409267425537, -0.00026472657918930054, -0.0002549290657043457, -0.00024513155221939087, -0.00023533403873443604, -0.0002255365252494812, -0.00021573901176452637, -0.00020594149827957153, -0.0001961439847946167, -0.00018634647130966187, -0.00017654895782470703, -0.0001667514443397522, -0.00015695393085479736, -0.00014715641736984253, -0.0001373589038848877, -0.00012756139039993286, -0.00011776387691497803, -0.0001079663634300232, -9.816884994506836e-05, -8.837133646011353e-05, -7.857382297515869e-05, -6.877630949020386e-05, -5.8978796005249023e-05, -4.918128252029419e-05, -3.9383769035339355e-05, -2.958625555038452e-05, -1.9788742065429688e-05, -9.991228580474854e-06, -1.9371509552001953e-07, 9.603798389434814e-06, 1.940131187438965e-05, 2.9198825359344482e-05, 3.8996338844299316e-05, 4.879385232925415e-05, 5.8591365814208984e-05, 6.838887929916382e-05, 7.818639278411865e-05, 8.798390626907349e-05, 9.778141975402832e-05, 0.00010757893323898315, 0.00011737644672393799, 0.00012717396020889282, 0.00013697147369384766, 0.0001467689871788025, 0.00015656650066375732, 0.00016636401414871216, 0.000176161527633667, 0.00018595904111862183, 0.00019575655460357666, 0.0002055540680885315, 0.00021535158157348633, 0.00022514909505844116, 0.000234946608543396, 0.00024474412202835083, 0.00025454163551330566, 0.0002643391489982605, 0.00027413666248321533, 0.00028393417596817017, 0.000293731689453125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 4.0, 10.0, 12.0, 12.0, 36.0, 83.0, 148.0, 357.0, 884.0, 2958.0, 16345.0, 308129.0, 676438.0, 36498.0, 4544.0, 1216.0, 482.0, 211.0, 90.0, 42.0, 23.0, 15.0, 4.0, 3.0, 6.0, 6.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2822265625, -1.235015869140625, -1.18780517578125, -1.140594482421875, -1.0933837890625, -1.046173095703125, -0.99896240234375, -0.951751708984375, -0.904541015625, -0.857330322265625, -0.81011962890625, -0.762908935546875, -0.7156982421875, -0.668487548828125, -0.62127685546875, -0.574066162109375, -0.52685546875, -0.479644775390625, -0.43243408203125, -0.385223388671875, -0.3380126953125, -0.290802001953125, -0.24359130859375, -0.196380615234375, -0.149169921875, -0.101959228515625, -0.05474853515625, -0.007537841796875, 0.0396728515625, 0.086883544921875, 0.13409423828125, 0.181304931640625, 0.228515625, 0.275726318359375, 0.32293701171875, 0.370147705078125, 0.4173583984375, 0.464569091796875, 0.51177978515625, 0.558990478515625, 0.606201171875, 0.653411865234375, 0.70062255859375, 0.747833251953125, 0.7950439453125, 0.842254638671875, 0.88946533203125, 0.936676025390625, 0.98388671875, 1.031097412109375, 1.07830810546875, 1.125518798828125, 1.1727294921875, 1.219940185546875, 1.26715087890625, 1.314361572265625, 1.361572265625, 1.408782958984375, 1.45599365234375, 1.503204345703125, 1.5504150390625, 1.597625732421875, 1.64483642578125, 1.692047119140625, 1.7392578125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 10.0, 13.0, 20.0, 31.0, 53.0, 73.0, 99.0, 120.0, 114.0, 130.0, 117.0, 85.0, 46.0, 26.0, 17.0, 8.0, 9.0, 9.0, 6.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.927734375, -1.86834716796875, -1.8089599609375, -1.74957275390625, -1.690185546875, -1.63079833984375, -1.5714111328125, -1.51202392578125, -1.45263671875, -1.39324951171875, -1.3338623046875, -1.27447509765625, -1.215087890625, -1.15570068359375, -1.0963134765625, -1.03692626953125, -0.9775390625, -0.91815185546875, -0.8587646484375, -0.79937744140625, -0.739990234375, -0.68060302734375, -0.6212158203125, -0.56182861328125, -0.50244140625, -0.44305419921875, -0.3836669921875, -0.32427978515625, -0.264892578125, -0.20550537109375, -0.1461181640625, -0.08673095703125, -0.02734375, 0.03204345703125, 0.0914306640625, 0.15081787109375, 0.210205078125, 0.26959228515625, 0.3289794921875, 0.38836669921875, 0.44775390625, 0.50714111328125, 0.5665283203125, 0.62591552734375, 0.685302734375, 0.74468994140625, 0.8040771484375, 0.86346435546875, 0.9228515625, 0.98223876953125, 1.0416259765625, 1.10101318359375, 1.160400390625, 1.21978759765625, 1.2791748046875, 1.33856201171875, 1.39794921875, 1.45733642578125, 1.5167236328125, 1.57611083984375, 1.635498046875, 1.69488525390625, 1.7542724609375, 1.81365966796875, 1.873046875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 5.0, 9.0, 40.0, 96.0, 189.0, 269.0, 205.0, 108.0, 46.0, 27.0, 8.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.424991607666016, -49.2414665222168, -48.05793762207031, -46.874412536621094, -45.690887451171875, -44.50735855102539, -43.32383346557617, -42.14030456542969, -40.95677947998047, -39.77325439453125, -38.589725494384766, -37.40620040893555, -36.22267150878906, -35.039146423339844, -33.855621337890625, -32.672096252441406, -31.488567352294922, -30.30504035949707, -29.12151336669922, -27.93798828125, -26.75446128845215, -25.570934295654297, -24.387409210205078, -23.203882217407227, -22.020355224609375, -20.836828231811523, -19.653301239013672, -18.469776153564453, -17.2862491607666, -16.10272216796875, -14.919196128845215, -13.73567008972168, -12.552139282226562, -11.368612289428711, -10.185086250305176, -9.00156021118164, -7.818033218383789, -6.634506702423096, -5.450980186462402, -4.267454147338867, -3.0839271545410156, -1.9004006385803223, -0.7168741226196289, 0.46665239334106445, 1.6501789093017578, 2.833705425262451, 4.0172319412231445, 5.20075798034668, 6.384284973144531, 7.567811489105225, 8.751338005065918, 9.934864044189453, 11.118391036987305, 12.301918029785156, 13.485444068908691, 14.668970108032227, 15.852497100830078, 17.03602409362793, 18.21955108642578, 19.403076171875, 20.58660316467285, 21.770130157470703, 22.953655242919922, 24.137182235717773, 25.320709228515625]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 4.0, 5.0, 17.0, 15.0, 18.0, 21.0, 19.0, 25.0, 32.0, 30.0, 37.0, 36.0, 49.0, 46.0, 58.0, 79.0, 60.0, 46.0, 49.0, 49.0, 49.0, 37.0, 34.0, 33.0, 19.0, 16.0, 23.0, 21.0, 19.0, 8.0, 12.0, 5.0, 6.0, 6.0, 2.0, 2.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.423269271850586, -24.696413040161133, -23.96955680847168, -23.242700576782227, -22.515844345092773, -21.78898811340332, -21.062129974365234, -20.33527374267578, -19.608417510986328, -18.881561279296875, -18.154705047607422, -17.42784881591797, -16.700992584228516, -15.974136352539062, -15.247279167175293, -14.52042293548584, -13.793567657470703, -13.06671142578125, -12.339855194091797, -11.612998962402344, -10.88614273071289, -10.159286499023438, -9.432429313659668, -8.705573081970215, -7.978716850280762, -7.251860618591309, -6.5250043869018555, -5.798147678375244, -5.071291446685791, -4.344435214996338, -3.6175785064697266, -2.8907222747802734, -2.163867950439453, -1.4370115995407104, -0.7101552486419678, 0.016701221466064453, 0.7435574531555176, 1.4704136848449707, 2.197270393371582, 2.924126625061035, 3.6509828567504883, 4.377839088439941, 5.1046953201293945, 5.831552028656006, 6.558408260345459, 7.285264492034912, 8.012121200561523, 8.738977432250977, 9.46583366394043, 10.192689895629883, 10.919546127319336, 11.646402359008789, 12.373258590698242, 13.100114822387695, 13.826972007751465, 14.553828239440918, 15.280684471130371, 16.00754165649414, 16.734397888183594, 17.461254119873047, 18.1881103515625, 18.914966583251953, 19.641822814941406, 20.36867904663086, 21.095535278320312]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 7.0, 14.0, 14.0, 23.0, 16.0, 46.0, 60.0, 99.0, 191.0, 348.0, 743.0, 1848.0, 5436.0, 28641.0, 3661454.0, 468186.0, 20175.0, 4326.0, 1433.0, 607.0, 257.0, 142.0, 97.0, 45.0, 26.0, 18.0, 6.0, 5.0, 4.0, 6.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.646484375, -3.55029296875, -3.4541015625, -3.35791015625, -3.26171875, -3.16552734375, -3.0693359375, -2.97314453125, -2.876953125, -2.78076171875, -2.6845703125, -2.58837890625, -2.4921875, -2.39599609375, -2.2998046875, -2.20361328125, -2.107421875, -2.01123046875, -1.9150390625, -1.81884765625, -1.72265625, -1.62646484375, -1.5302734375, -1.43408203125, -1.337890625, -1.24169921875, -1.1455078125, -1.04931640625, -0.953125, -0.85693359375, -0.7607421875, -0.66455078125, -0.568359375, -0.47216796875, -0.3759765625, -0.27978515625, -0.18359375, -0.08740234375, 0.0087890625, 0.10498046875, 0.201171875, 0.29736328125, 0.3935546875, 0.48974609375, 0.5859375, 0.68212890625, 0.7783203125, 0.87451171875, 0.970703125, 1.06689453125, 1.1630859375, 1.25927734375, 1.35546875, 1.45166015625, 1.5478515625, 1.64404296875, 1.740234375, 1.83642578125, 1.9326171875, 2.02880859375, 2.125, 2.22119140625, 2.3173828125, 2.41357421875, 2.509765625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 4.0, 4.0, 6.0, 8.0, 10.0, 14.0, 20.0, 36.0, 45.0, 67.0, 62.0, 69.0, 79.0, 87.0, 89.0, 83.0, 76.0, 58.0, 65.0, 45.0, 26.0, 16.0, 12.0, 14.0, 9.0, 5.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5703125, -1.5210723876953125, -1.471832275390625, -1.4225921630859375, -1.37335205078125, -1.3241119384765625, -1.274871826171875, -1.2256317138671875, -1.1763916015625, -1.1271514892578125, -1.077911376953125, -1.0286712646484375, -0.97943115234375, -0.9301910400390625, -0.880950927734375, -0.8317108154296875, -0.782470703125, -0.7332305908203125, -0.683990478515625, -0.6347503662109375, -0.58551025390625, -0.5362701416015625, -0.487030029296875, -0.4377899169921875, -0.3885498046875, -0.3393096923828125, -0.290069580078125, -0.2408294677734375, -0.19158935546875, -0.1423492431640625, -0.093109130859375, -0.0438690185546875, 0.00537109375, 0.0546112060546875, 0.103851318359375, 0.1530914306640625, 0.20233154296875, 0.2515716552734375, 0.300811767578125, 0.3500518798828125, 0.3992919921875, 0.4485321044921875, 0.497772216796875, 0.5470123291015625, 0.59625244140625, 0.6454925537109375, 0.694732666015625, 0.7439727783203125, 0.793212890625, 0.8424530029296875, 0.891693115234375, 0.9409332275390625, 0.99017333984375, 1.0394134521484375, 1.088653564453125, 1.1378936767578125, 1.1871337890625, 1.2363739013671875, 1.285614013671875, 1.3348541259765625, 1.38409423828125, 1.4333343505859375, 1.482574462890625, 1.5318145751953125, 1.5810546875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 1.0, 0.0, 7.0, 5.0, 1.0, 12.0, 12.0, 10.0, 18.0, 19.0, 28.0, 42.0, 55.0, 77.0, 109.0, 159.0, 212.0, 299.0, 491.0, 636.0, 1169.0, 2054.0, 3857.0, 9744.0, 32959.0, 206267.0, 3663942.0, 218725.0, 34016.0, 9921.0, 3988.0, 2029.0, 1205.0, 721.0, 444.0, 301.0, 205.0, 148.0, 113.0, 68.0, 70.0, 42.0, 33.0, 20.0, 12.0, 12.0, 9.0, 4.0, 8.0, 6.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.470703125, -1.420867919921875, -1.37103271484375, -1.321197509765625, -1.2713623046875, -1.221527099609375, -1.17169189453125, -1.121856689453125, -1.072021484375, -1.022186279296875, -0.97235107421875, -0.922515869140625, -0.8726806640625, -0.822845458984375, -0.77301025390625, -0.723175048828125, -0.67333984375, -0.623504638671875, -0.57366943359375, -0.523834228515625, -0.4739990234375, -0.424163818359375, -0.37432861328125, -0.324493408203125, -0.274658203125, -0.224822998046875, -0.17498779296875, -0.125152587890625, -0.0753173828125, -0.025482177734375, 0.02435302734375, 0.074188232421875, 0.1240234375, 0.173858642578125, 0.22369384765625, 0.273529052734375, 0.3233642578125, 0.373199462890625, 0.42303466796875, 0.472869873046875, 0.522705078125, 0.572540283203125, 0.62237548828125, 0.672210693359375, 0.7220458984375, 0.771881103515625, 0.82171630859375, 0.871551513671875, 0.92138671875, 0.971221923828125, 1.02105712890625, 1.070892333984375, 1.1207275390625, 1.170562744140625, 1.22039794921875, 1.270233154296875, 1.320068359375, 1.369903564453125, 1.41973876953125, 1.469573974609375, 1.5194091796875, 1.569244384765625, 1.61907958984375, 1.668914794921875, 1.71875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 7.0, 5.0, 16.0, 37.0, 39.0, 101.0, 322.0, 2807.0, 466.0, 141.0, 59.0, 22.0, 19.0, 8.0, 3.0, 5.0, 2.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6611328125, -0.6363296508789062, -0.6115264892578125, -0.5867233276367188, -0.561920166015625, -0.5371170043945312, -0.5123138427734375, -0.48751068115234375, -0.46270751953125, -0.43790435791015625, -0.4131011962890625, -0.38829803466796875, -0.363494873046875, -0.33869171142578125, -0.3138885498046875, -0.28908538818359375, -0.2642822265625, -0.23947906494140625, -0.2146759033203125, -0.18987274169921875, -0.165069580078125, -0.14026641845703125, -0.1154632568359375, -0.09066009521484375, -0.06585693359375, -0.04105377197265625, -0.0162506103515625, 0.00855255126953125, 0.033355712890625, 0.05815887451171875, 0.0829620361328125, 0.10776519775390625, 0.132568359375, 0.15737152099609375, 0.1821746826171875, 0.20697784423828125, 0.231781005859375, 0.25658416748046875, 0.2813873291015625, 0.30619049072265625, 0.33099365234375, 0.35579681396484375, 0.3805999755859375, 0.40540313720703125, 0.430206298828125, 0.45500946044921875, 0.4798126220703125, 0.5046157836914062, 0.5294189453125, 0.5542221069335938, 0.5790252685546875, 0.6038284301757812, 0.628631591796875, 0.6534347534179688, 0.6782379150390625, 0.7030410766601562, 0.72784423828125, 0.7526473999023438, 0.7774505615234375, 0.8022537231445312, 0.827056884765625, 0.8518600463867188, 0.8766632080078125, 0.9014663696289062, 0.92626953125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 11.0, 24.0, 79.0, 173.0, 234.0, 210.0, 154.0, 80.0, 30.0, 9.0, 7.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.9466633796691895, -6.815336227416992, -6.684009552001953, -6.552682399749756, -6.421355724334717, -6.2900285720825195, -6.1587018966674805, -6.027374744415283, -5.896047592163086, -5.764720439910889, -5.63339376449585, -5.502066612243652, -5.370739936828613, -5.239412784576416, -5.108085632324219, -4.97675895690918, -4.845432281494141, -4.714105129241943, -4.582778453826904, -4.451451301574707, -4.320124626159668, -4.188797473907471, -4.057470321655273, -3.9261436462402344, -3.794816493988037, -3.663489580154419, -3.532162666320801, -3.4008355140686035, -3.2695086002349854, -3.138181686401367, -3.006854772567749, -2.875527858734131, -2.7442007064819336, -2.6128737926483154, -2.4815468788146973, -2.3502197265625, -2.218892812728882, -2.0875658988952637, -1.9562389850616455, -1.8249120712280273, -1.6935850381851196, -1.5622581243515015, -1.4309310913085938, -1.2996041774749756, -1.1682772636413574, -1.0369502305984497, -0.9056233167648315, -0.7742963433265686, -0.6429693698883057, -0.5116423964500427, -0.3803154528141022, -0.24898850917816162, -0.11766153573989868, 0.013665437698364258, 0.14499235153198242, 0.27631932497024536, 0.4076462984085083, 0.5389732718467712, 0.6703002452850342, 0.8016271591186523, 0.9329541325569153, 1.0642811059951782, 1.1956080198287964, 1.326935052871704, 1.4582619667053223]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 2.0, 5.0, 4.0, 10.0, 7.0, 2.0, 8.0, 11.0, 16.0, 20.0, 12.0, 22.0, 20.0, 17.0, 27.0, 37.0, 27.0, 36.0, 37.0, 42.0, 38.0, 49.0, 52.0, 41.0, 35.0, 43.0, 42.0, 30.0, 31.0, 28.0, 34.0, 33.0, 25.0, 12.0, 24.0, 23.0, 18.0, 13.0, 11.0, 8.0, 11.0, 5.0, 7.0, 9.0, 9.0, 2.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1455799341201782, -1.1064914464950562, -1.067402958869934, -1.028314471244812, -0.9892260432243347, -0.9501375555992126, -0.9110491275787354, -0.8719606399536133, -0.8328721523284912, -0.7937836647033691, -0.7546951770782471, -0.7156067490577698, -0.6765182614326477, -0.6374297738075256, -0.5983413457870483, -0.5592528581619263, -0.5201643705368042, -0.48107588291168213, -0.44198742508888245, -0.40289896726608276, -0.3638104796409607, -0.3247219920158386, -0.28563353419303894, -0.24654507637023926, -0.2074565887451172, -0.1683681160211563, -0.12927964329719543, -0.09019117057323456, -0.05110269784927368, -0.012014225125312805, 0.02707424759864807, 0.06616270542144775, 0.10525107383728027, 0.14433954656124115, 0.18342801928520203, 0.2225164920091629, 0.2616049647331238, 0.30069345235824585, 0.33978191018104553, 0.3788703680038452, 0.4179588556289673, 0.45704734325408936, 0.49613580107688904, 0.5352242588996887, 0.5743127465248108, 0.6134012341499329, 0.6524896621704102, 0.6915781497955322, 0.7306666374206543, 0.7697551250457764, 0.8088436126708984, 0.8479320406913757, 0.8870205283164978, 0.9261090159416199, 0.9651974439620972, 1.0042859315872192, 1.0433744192123413, 1.0824629068374634, 1.1215513944625854, 1.1606398820877075, 1.19972825050354, 1.238816738128662, 1.2779052257537842, 1.3169937133789062, 1.3560822010040283]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 4.0, 7.0, 15.0, 16.0, 24.0, 48.0, 57.0, 114.0, 249.0, 494.0, 1292.0, 4449.0, 22522.0, 163571.0, 642807.0, 181472.0, 24108.0, 4912.0, 1395.0, 502.0, 220.0, 110.0, 68.0, 37.0, 25.0, 12.0, 11.0, 11.0, 4.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9716796875, -1.8841400146484375, -1.796600341796875, -1.7090606689453125, -1.62152099609375, -1.5339813232421875, -1.446441650390625, -1.3589019775390625, -1.2713623046875, -1.1838226318359375, -1.096282958984375, -1.0087432861328125, -0.92120361328125, -0.8336639404296875, -0.746124267578125, -0.6585845947265625, -0.571044921875, -0.4835052490234375, -0.395965576171875, -0.3084259033203125, -0.22088623046875, -0.1333465576171875, -0.045806884765625, 0.0417327880859375, 0.1292724609375, 0.2168121337890625, 0.304351806640625, 0.3918914794921875, 0.47943115234375, 0.5669708251953125, 0.654510498046875, 0.7420501708984375, 0.82958984375, 0.9171295166015625, 1.004669189453125, 1.0922088623046875, 1.17974853515625, 1.2672882080078125, 1.354827880859375, 1.4423675537109375, 1.5299072265625, 1.6174468994140625, 1.704986572265625, 1.7925262451171875, 1.88006591796875, 1.9676055908203125, 2.055145263671875, 2.1426849365234375, 2.230224609375, 2.3177642822265625, 2.405303955078125, 2.4928436279296875, 2.58038330078125, 2.6679229736328125, 2.755462646484375, 2.8430023193359375, 2.9305419921875, 3.0180816650390625, 3.105621337890625, 3.1931610107421875, 3.28070068359375, 3.3682403564453125, 3.455780029296875, 3.5433197021484375, 3.630859375]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 6.0, 8.0, 9.0, 13.0, 25.0, 30.0, 53.0, 47.0, 74.0, 62.0, 75.0, 94.0, 92.0, 78.0, 71.0, 67.0, 58.0, 43.0, 30.0, 19.0, 18.0, 6.0, 10.0, 10.0, 3.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.46875, -1.42138671875, -1.3740234375, -1.32666015625, -1.279296875, -1.23193359375, -1.1845703125, -1.13720703125, -1.08984375, -1.04248046875, -0.9951171875, -0.94775390625, -0.900390625, -0.85302734375, -0.8056640625, -0.75830078125, -0.7109375, -0.66357421875, -0.6162109375, -0.56884765625, -0.521484375, -0.47412109375, -0.4267578125, -0.37939453125, -0.33203125, -0.28466796875, -0.2373046875, -0.18994140625, -0.142578125, -0.09521484375, -0.0478515625, -0.00048828125, 0.046875, 0.09423828125, 0.1416015625, 0.18896484375, 0.236328125, 0.28369140625, 0.3310546875, 0.37841796875, 0.42578125, 0.47314453125, 0.5205078125, 0.56787109375, 0.615234375, 0.66259765625, 0.7099609375, 0.75732421875, 0.8046875, 0.85205078125, 0.8994140625, 0.94677734375, 0.994140625, 1.04150390625, 1.0888671875, 1.13623046875, 1.18359375, 1.23095703125, 1.2783203125, 1.32568359375, 1.373046875, 1.42041015625, 1.4677734375, 1.51513671875, 1.5625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 7.0, 7.0, 2.0, 8.0, 5.0, 11.0, 27.0, 23.0, 39.0, 55.0, 110.0, 226.0, 499.0, 1466.0, 6261.0, 68375.0, 848584.0, 111537.0, 8374.0, 1702.0, 578.0, 286.0, 140.0, 72.0, 49.0, 29.0, 20.0, 18.0, 12.0, 8.0, 11.0, 3.0, 2.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.48828125, -3.3662109375, -3.244140625, -3.1220703125, -3.0, -2.8779296875, -2.755859375, -2.6337890625, -2.51171875, -2.3896484375, -2.267578125, -2.1455078125, -2.0234375, -1.9013671875, -1.779296875, -1.6572265625, -1.53515625, -1.4130859375, -1.291015625, -1.1689453125, -1.046875, -0.9248046875, -0.802734375, -0.6806640625, -0.55859375, -0.4365234375, -0.314453125, -0.1923828125, -0.0703125, 0.0517578125, 0.173828125, 0.2958984375, 0.41796875, 0.5400390625, 0.662109375, 0.7841796875, 0.90625, 1.0283203125, 1.150390625, 1.2724609375, 1.39453125, 1.5166015625, 1.638671875, 1.7607421875, 1.8828125, 2.0048828125, 2.126953125, 2.2490234375, 2.37109375, 2.4931640625, 2.615234375, 2.7373046875, 2.859375, 2.9814453125, 3.103515625, 3.2255859375, 3.34765625, 3.4697265625, 3.591796875, 3.7138671875, 3.8359375, 3.9580078125, 4.080078125, 4.2021484375, 4.32421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 0.0, 5.0, 10.0, 12.0, 16.0, 16.0, 15.0, 12.0, 23.0, 22.0, 32.0, 32.0, 50.0, 44.0, 52.0, 49.0, 59.0, 50.0, 56.0, 63.0, 56.0, 44.0, 46.0, 22.0, 30.0, 27.0, 23.0, 17.0, 20.0, 16.0, 14.0, 14.0, 12.0, 9.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.12109375, -3.99273681640625, -3.8643798828125, -3.73602294921875, -3.607666015625, -3.47930908203125, -3.3509521484375, -3.22259521484375, -3.09423828125, -2.96588134765625, -2.8375244140625, -2.70916748046875, -2.580810546875, -2.45245361328125, -2.3240966796875, -2.19573974609375, -2.0673828125, -1.93902587890625, -1.8106689453125, -1.68231201171875, -1.553955078125, -1.42559814453125, -1.2972412109375, -1.16888427734375, -1.04052734375, -0.91217041015625, -0.7838134765625, -0.65545654296875, -0.527099609375, -0.39874267578125, -0.2703857421875, -0.14202880859375, -0.013671875, 0.11468505859375, 0.2430419921875, 0.37139892578125, 0.499755859375, 0.62811279296875, 0.7564697265625, 0.88482666015625, 1.01318359375, 1.14154052734375, 1.2698974609375, 1.39825439453125, 1.526611328125, 1.65496826171875, 1.7833251953125, 1.91168212890625, 2.0400390625, 2.16839599609375, 2.2967529296875, 2.42510986328125, 2.553466796875, 2.68182373046875, 2.8101806640625, 2.93853759765625, 3.06689453125, 3.19525146484375, 3.3236083984375, 3.45196533203125, 3.580322265625, 3.70867919921875, 3.8370361328125, 3.96539306640625, 4.09375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 8.0, 10.0, 13.0, 22.0, 37.0, 102.0, 250.0, 790.0, 5530.0, 823292.0, 214685.0, 2918.0, 527.0, 213.0, 77.0, 31.0, 29.0, 16.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.591796875, -2.483245849609375, -2.37469482421875, -2.266143798828125, -2.1575927734375, -2.049041748046875, -1.94049072265625, -1.831939697265625, -1.723388671875, -1.614837646484375, -1.50628662109375, -1.397735595703125, -1.2891845703125, -1.180633544921875, -1.07208251953125, -0.963531494140625, -0.85498046875, -0.746429443359375, -0.63787841796875, -0.529327392578125, -0.4207763671875, -0.312225341796875, -0.20367431640625, -0.095123291015625, 0.013427734375, 0.121978759765625, 0.23052978515625, 0.339080810546875, 0.4476318359375, 0.556182861328125, 0.66473388671875, 0.773284912109375, 0.8818359375, 0.990386962890625, 1.09893798828125, 1.207489013671875, 1.3160400390625, 1.424591064453125, 1.53314208984375, 1.641693115234375, 1.750244140625, 1.858795166015625, 1.96734619140625, 2.075897216796875, 2.1844482421875, 2.292999267578125, 2.40155029296875, 2.510101318359375, 2.61865234375, 2.727203369140625, 2.83575439453125, 2.944305419921875, 3.0528564453125, 3.161407470703125, 3.26995849609375, 3.378509521484375, 3.487060546875, 3.595611572265625, 3.70416259765625, 3.812713623046875, 3.9212646484375, 4.029815673828125, 4.13836669921875, 4.246917724609375, 4.35546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 12.0, 15.0, 13.0, 29.0, 40.0, 45.0, 62.0, 89.0, 120.0, 122.0, 101.0, 82.0, 77.0, 59.0, 42.0, 21.0, 27.0, 12.0, 7.0, 8.0, 9.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.00024402141571044922, -0.00023841951042413712, -0.000232817605137825, -0.0002272156998515129, -0.0002216137945652008, -0.0002160118892788887, -0.0002104099839925766, -0.0002048080787062645, -0.0001992061734199524, -0.0001936042681336403, -0.00018800236284732819, -0.00018240045756101608, -0.00017679855227470398, -0.00017119664698839188, -0.00016559474170207977, -0.00015999283641576767, -0.00015439093112945557, -0.00014878902584314346, -0.00014318712055683136, -0.00013758521527051926, -0.00013198330998420715, -0.00012638140469789505, -0.00012077949941158295, -0.00011517759412527084, -0.00010957568883895874, -0.00010397378355264664, -9.837187826633453e-05, -9.276997298002243e-05, -8.716806769371033e-05, -8.156616240739822e-05, -7.596425712108612e-05, -7.036235183477402e-05, -6.476044654846191e-05, -5.915854126214981e-05, -5.355663597583771e-05, -4.7954730689525604e-05, -4.23528254032135e-05, -3.67509201169014e-05, -3.1149014830589294e-05, -2.554710954427719e-05, -1.9945204257965088e-05, -1.4343298971652985e-05, -8.741393685340881e-06, -3.139488399028778e-06, 2.462416887283325e-06, 8.064322173595428e-06, 1.3666227459907532e-05, 1.9268132746219635e-05, 2.4870038032531738e-05, 3.047194331884384e-05, 3.6073848605155945e-05, 4.167575389146805e-05, 4.727765917778015e-05, 5.2879564464092255e-05, 5.848146975040436e-05, 6.408337503671646e-05, 6.968528032302856e-05, 7.528718560934067e-05, 8.088909089565277e-05, 8.649099618196487e-05, 9.209290146827698e-05, 9.769480675458908e-05, 0.00010329671204090118, 0.00010889861732721329, 0.00011450052261352539]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 10.0, 8.0, 16.0, 23.0, 52.0, 111.0, 298.0, 865.0, 5242.0, 240854.0, 787727.0, 11293.0, 1382.0, 381.0, 140.0, 76.0, 41.0, 16.0, 17.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.685546875, -2.606903076171875, -2.52825927734375, -2.449615478515625, -2.3709716796875, -2.292327880859375, -2.21368408203125, -2.135040283203125, -2.056396484375, -1.977752685546875, -1.89910888671875, -1.820465087890625, -1.7418212890625, -1.663177490234375, -1.58453369140625, -1.505889892578125, -1.42724609375, -1.348602294921875, -1.26995849609375, -1.191314697265625, -1.1126708984375, -1.034027099609375, -0.95538330078125, -0.876739501953125, -0.798095703125, -0.719451904296875, -0.64080810546875, -0.562164306640625, -0.4835205078125, -0.404876708984375, -0.32623291015625, -0.247589111328125, -0.1689453125, -0.090301513671875, -0.01165771484375, 0.066986083984375, 0.1456298828125, 0.224273681640625, 0.30291748046875, 0.381561279296875, 0.460205078125, 0.538848876953125, 0.61749267578125, 0.696136474609375, 0.7747802734375, 0.853424072265625, 0.93206787109375, 1.010711669921875, 1.08935546875, 1.167999267578125, 1.24664306640625, 1.325286865234375, 1.4039306640625, 1.482574462890625, 1.56121826171875, 1.639862060546875, 1.718505859375, 1.797149658203125, 1.87579345703125, 1.954437255859375, 2.0330810546875, 2.111724853515625, 2.19036865234375, 2.269012451171875, 2.34765625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 5.0, 11.0, 34.0, 50.0, 114.0, 167.0, 199.0, 184.0, 114.0, 61.0, 30.0, 13.0, 7.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.740234375, -3.6647186279296875, -3.589202880859375, -3.5136871337890625, -3.43817138671875, -3.3626556396484375, -3.287139892578125, -3.2116241455078125, -3.1361083984375, -3.0605926513671875, -2.985076904296875, -2.9095611572265625, -2.83404541015625, -2.7585296630859375, -2.683013916015625, -2.6074981689453125, -2.531982421875, -2.4564666748046875, -2.380950927734375, -2.3054351806640625, -2.22991943359375, -2.1544036865234375, -2.078887939453125, -2.0033721923828125, -1.9278564453125, -1.8523406982421875, -1.776824951171875, -1.7013092041015625, -1.62579345703125, -1.5502777099609375, -1.474761962890625, -1.3992462158203125, -1.32373046875, -1.2482147216796875, -1.172698974609375, -1.0971832275390625, -1.02166748046875, -0.9461517333984375, -0.870635986328125, -0.7951202392578125, -0.7196044921875, -0.6440887451171875, -0.568572998046875, -0.4930572509765625, -0.41754150390625, -0.3420257568359375, -0.266510009765625, -0.1909942626953125, -0.115478515625, -0.0399627685546875, 0.035552978515625, 0.1110687255859375, 0.18658447265625, 0.2621002197265625, 0.337615966796875, 0.4131317138671875, 0.4886474609375, 0.5641632080078125, 0.639678955078125, 0.7151947021484375, 0.79071044921875, 0.8662261962890625, 0.941741943359375, 1.0172576904296875, 1.0927734375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 13.0, 26.0, 38.0, 73.0, 115.0, 159.0, 188.0, 175.0, 98.0, 50.0, 37.0, 14.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-27.14012908935547, -26.38730812072754, -25.634489059448242, -24.881668090820312, -24.128849029541016, -23.376028060913086, -22.623207092285156, -21.87038803100586, -21.117568969726562, -20.364748001098633, -19.611928939819336, -18.859107971191406, -18.10628890991211, -17.35346794128418, -16.60064697265625, -15.847827911376953, -15.095006942749023, -14.34218692779541, -13.589366912841797, -12.836545944213867, -12.08372688293457, -11.33090591430664, -10.578085899353027, -9.825265884399414, -9.0724458694458, -8.319625854492188, -7.566805839538574, -6.813985347747803, -6.0611653327941895, -5.308345317840576, -4.555524826049805, -3.8027048110961914, -3.0498828887939453, -2.297062873840332, -1.5442426204681396, -0.7914223670959473, -0.038602352142333984, 0.7142176628112793, 1.4670381546020508, 2.219858169555664, 2.9726781845092773, 3.7254981994628906, 4.478318214416504, 5.231138706207275, 5.983958721160889, 6.736778736114502, 7.489599227905273, 8.242419242858887, 8.9952392578125, 9.748059272766113, 10.500879287719727, 11.253700256347656, 12.006519317626953, 12.759340286254883, 13.512160301208496, 14.26498031616211, 15.017800331115723, 15.770620346069336, 16.523441314697266, 17.276260375976562, 18.029081344604492, 18.78190040588379, 19.53472137451172, 20.287540435791016, 21.040361404418945]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 2.0, 3.0, 1.0, 4.0, 6.0, 3.0, 9.0, 6.0, 13.0, 15.0, 15.0, 14.0, 15.0, 22.0, 24.0, 26.0, 37.0, 38.0, 43.0, 18.0, 44.0, 48.0, 42.0, 37.0, 45.0, 41.0, 43.0, 33.0, 36.0, 38.0, 40.0, 45.0, 24.0, 27.0, 18.0, 25.0, 16.0, 13.0, 10.0, 11.0, 10.0, 9.0, 5.0, 6.0, 3.0, 6.0, 4.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-13.674097061157227, -13.221652030944824, -12.769207000732422, -12.316761016845703, -11.8643159866333, -11.411870956420898, -10.959425926208496, -10.506980895996094, -10.054534912109375, -9.602089881896973, -9.14964485168457, -8.697198867797852, -8.24475383758545, -7.792308807373047, -7.3398637771606445, -6.887418270111084, -6.434973239898682, -5.982528209686279, -5.530082702636719, -5.077637672424316, -4.625192165374756, -4.1727471351623535, -3.720301866531372, -3.2678565979003906, -2.815411329269409, -2.3629660606384277, -1.9105207920074463, -1.4580756425857544, -1.005630373954773, -0.553185224533081, -0.10073995590209961, 0.35170531272888184, 0.8041505813598633, 1.2565958499908447, 1.7090411186218262, 2.1614861488342285, 2.613931655883789, 3.0663766860961914, 3.518821954727173, 3.9712672233581543, 4.423712730407715, 4.876157760620117, 5.328603267669678, 5.78104829788208, 6.233493804931641, 6.685938835144043, 7.138383865356445, 7.590829372406006, 8.04327392578125, 8.495718955993652, 8.948163986206055, 9.400609970092773, 9.853055000305176, 10.305500030517578, 10.75794506072998, 11.210390090942383, 11.662836074829102, 12.115281105041504, 12.567726135253906, 13.020172119140625, 13.472617149353027, 13.92506217956543, 14.377507209777832, 14.829952239990234, 15.282398223876953]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 8.0, 9.0, 18.0, 27.0, 38.0, 69.0, 154.0, 397.0, 1741.0, 33614.0, 4145879.0, 10773.0, 1007.0, 301.0, 113.0, 68.0, 35.0, 15.0, 7.0, 5.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.46875, -5.2530517578125, -5.037353515625, -4.8216552734375, -4.60595703125, -4.3902587890625, -4.174560546875, -3.9588623046875, -3.7431640625, -3.5274658203125, -3.311767578125, -3.0960693359375, -2.88037109375, -2.6646728515625, -2.448974609375, -2.2332763671875, -2.017578125, -1.8018798828125, -1.586181640625, -1.3704833984375, -1.15478515625, -0.9390869140625, -0.723388671875, -0.5076904296875, -0.2919921875, -0.0762939453125, 0.139404296875, 0.3551025390625, 0.57080078125, 0.7864990234375, 1.002197265625, 1.2178955078125, 1.43359375, 1.6492919921875, 1.864990234375, 2.0806884765625, 2.29638671875, 2.5120849609375, 2.727783203125, 2.9434814453125, 3.1591796875, 3.3748779296875, 3.590576171875, 3.8062744140625, 4.02197265625, 4.2376708984375, 4.453369140625, 4.6690673828125, 4.884765625, 5.1004638671875, 5.316162109375, 5.5318603515625, 5.74755859375, 5.9632568359375, 6.178955078125, 6.3946533203125, 6.6103515625, 6.8260498046875, 7.041748046875, 7.2574462890625, 7.47314453125, 7.6888427734375, 7.904541015625, 8.1202392578125, 8.3359375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 5.0, 11.0, 12.0, 27.0, 44.0, 49.0, 75.0, 69.0, 92.0, 90.0, 106.0, 75.0, 79.0, 71.0, 67.0, 40.0, 29.0, 21.0, 11.0, 10.0, 6.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9638671875, -1.909820556640625, -1.85577392578125, -1.801727294921875, -1.7476806640625, -1.693634033203125, -1.63958740234375, -1.585540771484375, -1.531494140625, -1.477447509765625, -1.42340087890625, -1.369354248046875, -1.3153076171875, -1.261260986328125, -1.20721435546875, -1.153167724609375, -1.09912109375, -1.045074462890625, -0.99102783203125, -0.936981201171875, -0.8829345703125, -0.828887939453125, -0.77484130859375, -0.720794677734375, -0.666748046875, -0.612701416015625, -0.55865478515625, -0.504608154296875, -0.4505615234375, -0.396514892578125, -0.34246826171875, -0.288421630859375, -0.234375, -0.180328369140625, -0.12628173828125, -0.072235107421875, -0.0181884765625, 0.035858154296875, 0.08990478515625, 0.143951416015625, 0.197998046875, 0.252044677734375, 0.30609130859375, 0.360137939453125, 0.4141845703125, 0.468231201171875, 0.52227783203125, 0.576324462890625, 0.63037109375, 0.684417724609375, 0.73846435546875, 0.792510986328125, 0.8465576171875, 0.900604248046875, 0.95465087890625, 1.008697509765625, 1.062744140625, 1.116790771484375, 1.17083740234375, 1.224884033203125, 1.2789306640625, 1.332977294921875, 1.38702392578125, 1.441070556640625, 1.4951171875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 3.0, 6.0, 14.0, 18.0, 21.0, 24.0, 47.0, 74.0, 107.0, 139.0, 198.0, 309.0, 536.0, 826.0, 1608.0, 3322.0, 8968.0, 34238.0, 335988.0, 3708159.0, 74530.0, 15114.0, 5079.0, 2111.0, 1032.0, 620.0, 407.0, 242.0, 166.0, 113.0, 82.0, 53.0, 39.0, 23.0, 23.0, 13.0, 11.0, 4.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.80859375, -1.7586517333984375, -1.708709716796875, -1.6587677001953125, -1.60882568359375, -1.5588836669921875, -1.508941650390625, -1.4589996337890625, -1.4090576171875, -1.3591156005859375, -1.309173583984375, -1.2592315673828125, -1.20928955078125, -1.1593475341796875, -1.109405517578125, -1.0594635009765625, -1.009521484375, -0.9595794677734375, -0.909637451171875, -0.8596954345703125, -0.80975341796875, -0.7598114013671875, -0.709869384765625, -0.6599273681640625, -0.6099853515625, -0.5600433349609375, -0.510101318359375, -0.4601593017578125, -0.41021728515625, -0.3602752685546875, -0.310333251953125, -0.2603912353515625, -0.21044921875, -0.1605072021484375, -0.110565185546875, -0.0606231689453125, -0.01068115234375, 0.0392608642578125, 0.089202880859375, 0.1391448974609375, 0.1890869140625, 0.2390289306640625, 0.288970947265625, 0.3389129638671875, 0.38885498046875, 0.4387969970703125, 0.488739013671875, 0.5386810302734375, 0.588623046875, 0.6385650634765625, 0.688507080078125, 0.7384490966796875, 0.78839111328125, 0.8383331298828125, 0.888275146484375, 0.9382171630859375, 0.9881591796875, 1.0381011962890625, 1.088043212890625, 1.1379852294921875, 1.18792724609375, 1.2378692626953125, 1.287811279296875, 1.3377532958984375, 1.3876953125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 6.0, 16.0, 29.0, 80.0, 229.0, 2987.0, 461.0, 125.0, 53.0, 29.0, 21.0, 14.0, 5.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.763671875, -0.7434539794921875, -0.723236083984375, -0.7030181884765625, -0.68280029296875, -0.6625823974609375, -0.642364501953125, -0.6221466064453125, -0.6019287109375, -0.5817108154296875, -0.561492919921875, -0.5412750244140625, -0.52105712890625, -0.5008392333984375, -0.480621337890625, -0.4604034423828125, -0.440185546875, -0.4199676513671875, -0.399749755859375, -0.3795318603515625, -0.35931396484375, -0.3390960693359375, -0.318878173828125, -0.2986602783203125, -0.2784423828125, -0.2582244873046875, -0.238006591796875, -0.2177886962890625, -0.19757080078125, -0.1773529052734375, -0.157135009765625, -0.1369171142578125, -0.11669921875, -0.0964813232421875, -0.076263427734375, -0.0560455322265625, -0.03582763671875, -0.0156097412109375, 0.004608154296875, 0.0248260498046875, 0.0450439453125, 0.0652618408203125, 0.085479736328125, 0.1056976318359375, 0.12591552734375, 0.1461334228515625, 0.166351318359375, 0.1865692138671875, 0.206787109375, 0.2270050048828125, 0.247222900390625, 0.2674407958984375, 0.28765869140625, 0.3078765869140625, 0.328094482421875, 0.3483123779296875, 0.3685302734375, 0.3887481689453125, 0.408966064453125, 0.4291839599609375, 0.44940185546875, 0.4696197509765625, 0.489837646484375, 0.5100555419921875, 0.5302734375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 7.0, 6.0, 25.0, 48.0, 87.0, 99.0, 167.0, 183.0, 151.0, 97.0, 64.0, 29.0, 21.0, 7.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.023097515106201, -2.952439308166504, -2.8817811012268066, -2.8111228942871094, -2.740464687347412, -2.669806480407715, -2.5991482734680176, -2.5284900665283203, -2.457831859588623, -2.387173652648926, -2.3165154457092285, -2.2458572387695312, -2.175199031829834, -2.1045408248901367, -2.0338826179504395, -1.9632242918014526, -1.8925659656524658, -1.8219077587127686, -1.7512495517730713, -1.680591344833374, -1.6099331378936768, -1.5392749309539795, -1.4686166048049927, -1.3979583978652954, -1.3273001909255981, -1.2566419839859009, -1.1859837770462036, -1.1153255701065063, -1.0446672439575195, -0.974009096622467, -0.903350830078125, -0.8326926231384277, -0.7620344161987305, -0.6913762092590332, -0.6207180023193359, -0.5500597357749939, -0.47940152883529663, -0.40874332189559937, -0.3380850851535797, -0.26742684841156006, -0.1967686414718628, -0.12611041963100433, -0.055452197790145874, 0.015206024050712585, 0.08586424589157104, 0.1565224528312683, 0.22718068957328796, 0.2978389263153076, 0.3684971332550049, 0.43915534019470215, 0.5098135471343994, 0.5804718136787415, 0.6511300206184387, 0.721788227558136, 0.792446494102478, 0.8631047010421753, 0.9337629079818726, 1.0044211149215698, 1.075079321861267, 1.1457375288009644, 1.2163958549499512, 1.2870540618896484, 1.3577122688293457, 1.428370475769043, 1.4990286827087402]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 1.0, 6.0, 11.0, 17.0, 16.0, 21.0, 13.0, 20.0, 24.0, 34.0, 37.0, 40.0, 32.0, 49.0, 51.0, 48.0, 44.0, 41.0, 59.0, 49.0, 37.0, 44.0, 36.0, 39.0, 40.0, 23.0, 26.0, 18.0, 17.0, 14.0, 12.0, 22.0, 6.0, 15.0, 5.0, 3.0, 9.0, 2.0, 4.0, 1.0, 6.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.147050380706787, -1.1110390424728394, -1.0750278234481812, -1.0390164852142334, -1.0030052661895752, -0.9669939875602722, -0.9309827089309692, -0.8949713706970215, -0.8589601516723633, -0.8229488730430603, -0.7869375944137573, -0.7509263157844543, -0.7149150371551514, -0.6789037585258484, -0.6428924798965454, -0.6068811416625977, -0.5708698630332947, -0.5348585844039917, -0.4988473057746887, -0.46283602714538574, -0.42682474851608276, -0.3908134698867798, -0.3548021614551544, -0.31879088282585144, -0.28277960419654846, -0.24676832556724548, -0.2107570469379425, -0.17474575340747833, -0.13873447477817535, -0.10272319614887238, -0.0667119026184082, -0.030700623989105225, 0.005310654640197754, 0.04132193699479103, 0.07733321934938431, 0.11334450542926788, 0.14935578405857086, 0.18536706268787384, 0.221378356218338, 0.257389634847641, 0.29340091347694397, 0.32941219210624695, 0.3654234707355499, 0.4014347791671753, 0.43744605779647827, 0.47345733642578125, 0.5094686150550842, 0.5454798936843872, 0.5814911723136902, 0.6175024509429932, 0.6535137295722961, 0.6895250082015991, 0.7255362868309021, 0.7615475654602051, 0.7975589036941528, 0.833570122718811, 0.8695814609527588, 0.9055927395820618, 0.9416040182113647, 0.9776152968406677, 1.0136265754699707, 1.0496379137039185, 1.0856491327285767, 1.1216604709625244, 1.1576716899871826]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 10.0, 9.0, 17.0, 23.0, 43.0, 89.0, 149.0, 321.0, 822.0, 2472.0, 11229.0, 88295.0, 653543.0, 259000.0, 25560.0, 4638.0, 1275.0, 527.0, 241.0, 124.0, 77.0, 34.0, 14.0, 13.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.169921875, -3.090118408203125, -3.01031494140625, -2.930511474609375, -2.8507080078125, -2.770904541015625, -2.69110107421875, -2.611297607421875, -2.531494140625, -2.451690673828125, -2.37188720703125, -2.292083740234375, -2.2122802734375, -2.132476806640625, -2.05267333984375, -1.972869873046875, -1.89306640625, -1.813262939453125, -1.73345947265625, -1.653656005859375, -1.5738525390625, -1.494049072265625, -1.41424560546875, -1.334442138671875, -1.254638671875, -1.174835205078125, -1.09503173828125, -1.015228271484375, -0.9354248046875, -0.855621337890625, -0.77581787109375, -0.696014404296875, -0.6162109375, -0.536407470703125, -0.45660400390625, -0.376800537109375, -0.2969970703125, -0.217193603515625, -0.13739013671875, -0.057586669921875, 0.022216796875, 0.102020263671875, 0.18182373046875, 0.261627197265625, 0.3414306640625, 0.421234130859375, 0.50103759765625, 0.580841064453125, 0.66064453125, 0.740447998046875, 0.82025146484375, 0.900054931640625, 0.9798583984375, 1.059661865234375, 1.13946533203125, 1.219268798828125, 1.299072265625, 1.378875732421875, 1.45867919921875, 1.538482666015625, 1.6182861328125, 1.698089599609375, 1.77789306640625, 1.857696533203125, 1.9375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 9.0, 12.0, 22.0, 39.0, 49.0, 53.0, 63.0, 73.0, 97.0, 89.0, 85.0, 81.0, 65.0, 76.0, 62.0, 36.0, 24.0, 21.0, 18.0, 7.0, 8.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.802734375, -1.7513427734375, -1.699951171875, -1.6485595703125, -1.59716796875, -1.5457763671875, -1.494384765625, -1.4429931640625, -1.3916015625, -1.3402099609375, -1.288818359375, -1.2374267578125, -1.18603515625, -1.1346435546875, -1.083251953125, -1.0318603515625, -0.98046875, -0.9290771484375, -0.877685546875, -0.8262939453125, -0.77490234375, -0.7235107421875, -0.672119140625, -0.6207275390625, -0.5693359375, -0.5179443359375, -0.466552734375, -0.4151611328125, -0.36376953125, -0.3123779296875, -0.260986328125, -0.2095947265625, -0.158203125, -0.1068115234375, -0.055419921875, -0.0040283203125, 0.04736328125, 0.0987548828125, 0.150146484375, 0.2015380859375, 0.2529296875, 0.3043212890625, 0.355712890625, 0.4071044921875, 0.45849609375, 0.5098876953125, 0.561279296875, 0.6126708984375, 0.6640625, 0.7154541015625, 0.766845703125, 0.8182373046875, 0.86962890625, 0.9210205078125, 0.972412109375, 1.0238037109375, 1.0751953125, 1.1265869140625, 1.177978515625, 1.2293701171875, 1.28076171875, 1.3321533203125, 1.383544921875, 1.4349365234375, 1.486328125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 8.0, 6.0, 3.0, 6.0, 8.0, 3.0, 7.0, 17.0, 22.0, 30.0, 38.0, 60.0, 99.0, 162.0, 309.0, 675.0, 1502.0, 6100.0, 80378.0, 844906.0, 103871.0, 7113.0, 1648.0, 676.0, 350.0, 205.0, 113.0, 74.0, 36.0, 28.0, 25.0, 23.0, 24.0, 11.0, 6.0, 3.0, 6.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.947265625, -2.856689453125, -2.76611328125, -2.675537109375, -2.5849609375, -2.494384765625, -2.40380859375, -2.313232421875, -2.22265625, -2.132080078125, -2.04150390625, -1.950927734375, -1.8603515625, -1.769775390625, -1.67919921875, -1.588623046875, -1.498046875, -1.407470703125, -1.31689453125, -1.226318359375, -1.1357421875, -1.045166015625, -0.95458984375, -0.864013671875, -0.7734375, -0.682861328125, -0.59228515625, -0.501708984375, -0.4111328125, -0.320556640625, -0.22998046875, -0.139404296875, -0.048828125, 0.041748046875, 0.13232421875, 0.222900390625, 0.3134765625, 0.404052734375, 0.49462890625, 0.585205078125, 0.67578125, 0.766357421875, 0.85693359375, 0.947509765625, 1.0380859375, 1.128662109375, 1.21923828125, 1.309814453125, 1.400390625, 1.490966796875, 1.58154296875, 1.672119140625, 1.7626953125, 1.853271484375, 1.94384765625, 2.034423828125, 2.125, 2.215576171875, 2.30615234375, 2.396728515625, 2.4873046875, 2.577880859375, 2.66845703125, 2.759033203125, 2.849609375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 3.0, 1.0, 5.0, 2.0, 8.0, 3.0, 7.0, 14.0, 3.0, 12.0, 27.0, 15.0, 17.0, 21.0, 22.0, 26.0, 37.0, 27.0, 38.0, 35.0, 49.0, 48.0, 44.0, 49.0, 52.0, 41.0, 45.0, 34.0, 30.0, 30.0, 34.0, 29.0, 25.0, 26.0, 22.0, 21.0, 21.0, 16.0, 13.0, 8.0, 9.0, 7.0, 8.0, 6.0, 6.0, 2.0, 1.0, 5.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.00390625, -2.906097412109375, -2.80828857421875, -2.710479736328125, -2.6126708984375, -2.514862060546875, -2.41705322265625, -2.319244384765625, -2.221435546875, -2.123626708984375, -2.02581787109375, -1.928009033203125, -1.8302001953125, -1.732391357421875, -1.63458251953125, -1.536773681640625, -1.43896484375, -1.341156005859375, -1.24334716796875, -1.145538330078125, -1.0477294921875, -0.949920654296875, -0.85211181640625, -0.754302978515625, -0.656494140625, -0.558685302734375, -0.46087646484375, -0.363067626953125, -0.2652587890625, -0.167449951171875, -0.06964111328125, 0.028167724609375, 0.1259765625, 0.223785400390625, 0.32159423828125, 0.419403076171875, 0.5172119140625, 0.615020751953125, 0.71282958984375, 0.810638427734375, 0.908447265625, 1.006256103515625, 1.10406494140625, 1.201873779296875, 1.2996826171875, 1.397491455078125, 1.49530029296875, 1.593109130859375, 1.69091796875, 1.788726806640625, 1.88653564453125, 1.984344482421875, 2.0821533203125, 2.179962158203125, 2.27777099609375, 2.375579833984375, 2.473388671875, 2.571197509765625, 2.66900634765625, 2.766815185546875, 2.8646240234375, 2.962432861328125, 3.06024169921875, 3.158050537109375, 3.255859375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 15.0, 24.0, 52.0, 97.0, 432.0, 3174.0, 824155.0, 218032.0, 2041.0, 331.0, 135.0, 28.0, 10.0, 11.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.693359375, -3.600799560546875, -3.50823974609375, -3.415679931640625, -3.3231201171875, -3.230560302734375, -3.13800048828125, -3.045440673828125, -2.952880859375, -2.860321044921875, -2.76776123046875, -2.675201416015625, -2.5826416015625, -2.490081787109375, -2.39752197265625, -2.304962158203125, -2.21240234375, -2.119842529296875, -2.02728271484375, -1.934722900390625, -1.8421630859375, -1.749603271484375, -1.65704345703125, -1.564483642578125, -1.471923828125, -1.379364013671875, -1.28680419921875, -1.194244384765625, -1.1016845703125, -1.009124755859375, -0.91656494140625, -0.824005126953125, -0.7314453125, -0.638885498046875, -0.54632568359375, -0.453765869140625, -0.3612060546875, -0.268646240234375, -0.17608642578125, -0.083526611328125, 0.009033203125, 0.101593017578125, 0.19415283203125, 0.286712646484375, 0.3792724609375, 0.471832275390625, 0.56439208984375, 0.656951904296875, 0.74951171875, 0.842071533203125, 0.93463134765625, 1.027191162109375, 1.1197509765625, 1.212310791015625, 1.30487060546875, 1.397430419921875, 1.489990234375, 1.582550048828125, 1.67510986328125, 1.767669677734375, 1.8602294921875, 1.952789306640625, 2.04534912109375, 2.137908935546875, 2.23046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 2.0, 8.0, 6.0, 13.0, 8.0, 15.0, 13.0, 18.0, 23.0, 23.0, 28.0, 43.0, 38.0, 61.0, 62.0, 81.0, 74.0, 75.0, 68.0, 56.0, 41.0, 37.0, 35.0, 30.0, 25.0, 30.0, 20.0, 13.0, 15.0, 15.0, 10.0, 6.0, 2.0, 4.0, 5.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00010007619857788086, -9.745266288518906e-05, -9.482912719249725e-05, -9.220559149980545e-05, -8.958205580711365e-05, -8.695852011442184e-05, -8.433498442173004e-05, -8.171144872903824e-05, -7.908791303634644e-05, -7.646437734365463e-05, -7.384084165096283e-05, -7.121730595827103e-05, -6.859377026557922e-05, -6.597023457288742e-05, -6.334669888019562e-05, -6.0723163187503815e-05, -5.809962749481201e-05, -5.547609180212021e-05, -5.2852556109428406e-05, -5.02290204167366e-05, -4.76054847240448e-05, -4.4981949031353e-05, -4.2358413338661194e-05, -3.973487764596939e-05, -3.711134195327759e-05, -3.4487806260585785e-05, -3.186427056789398e-05, -2.924073487520218e-05, -2.6617199182510376e-05, -2.3993663489818573e-05, -2.137012779712677e-05, -1.8746592104434967e-05, -1.6123056411743164e-05, -1.3499520719051361e-05, -1.0875985026359558e-05, -8.252449333667755e-06, -5.628913640975952e-06, -3.005377948284149e-06, -3.818422555923462e-07, 2.2416934370994568e-06, 4.86522912979126e-06, 7.488764822483063e-06, 1.0112300515174866e-05, 1.2735836207866669e-05, 1.535937190055847e-05, 1.7982907593250275e-05, 2.0606443285942078e-05, 2.322997897863388e-05, 2.5853514671325684e-05, 2.8477050364017487e-05, 3.110058605670929e-05, 3.372412174940109e-05, 3.6347657442092896e-05, 3.89711931347847e-05, 4.15947288274765e-05, 4.4218264520168304e-05, 4.684180021286011e-05, 4.946533590555191e-05, 5.208887159824371e-05, 5.4712407290935516e-05, 5.733594298362732e-05, 5.995947867631912e-05, 6.258301436901093e-05, 6.520655006170273e-05, 6.783008575439453e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 2.0, 4.0, 12.0, 12.0, 21.0, 30.0, 63.0, 110.0, 258.0, 700.0, 2378.0, 18709.0, 714266.0, 299784.0, 9545.0, 1667.0, 532.0, 216.0, 97.0, 61.0, 36.0, 13.0, 10.0, 7.0, 5.0, 3.0, 7.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-1.822265625, -1.777679443359375, -1.73309326171875, -1.688507080078125, -1.6439208984375, -1.599334716796875, -1.55474853515625, -1.510162353515625, -1.465576171875, -1.420989990234375, -1.37640380859375, -1.331817626953125, -1.2872314453125, -1.242645263671875, -1.19805908203125, -1.153472900390625, -1.10888671875, -1.064300537109375, -1.01971435546875, -0.975128173828125, -0.9305419921875, -0.885955810546875, -0.84136962890625, -0.796783447265625, -0.752197265625, -0.707611083984375, -0.66302490234375, -0.618438720703125, -0.5738525390625, -0.529266357421875, -0.48468017578125, -0.440093994140625, -0.3955078125, -0.350921630859375, -0.30633544921875, -0.261749267578125, -0.2171630859375, -0.172576904296875, -0.12799072265625, -0.083404541015625, -0.038818359375, 0.005767822265625, 0.05035400390625, 0.094940185546875, 0.1395263671875, 0.184112548828125, 0.22869873046875, 0.273284912109375, 0.31787109375, 0.362457275390625, 0.40704345703125, 0.451629638671875, 0.4962158203125, 0.540802001953125, 0.58538818359375, 0.629974365234375, 0.674560546875, 0.719146728515625, 0.76373291015625, 0.808319091796875, 0.8529052734375, 0.897491455078125, 0.94207763671875, 0.986663818359375, 1.03125]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 4.0, 4.0, 8.0, 9.0, 17.0, 23.0, 28.0, 48.0, 57.0, 64.0, 99.0, 103.0, 104.0, 109.0, 92.0, 62.0, 49.0, 35.0, 24.0, 22.0, 12.0, 9.0, 10.0, 6.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2666015625, -1.2359390258789062, -1.2052764892578125, -1.1746139526367188, -1.143951416015625, -1.1132888793945312, -1.0826263427734375, -1.0519638061523438, -1.02130126953125, -0.9906387329101562, -0.9599761962890625, -0.9293136596679688, -0.898651123046875, -0.8679885864257812, -0.8373260498046875, -0.8066635131835938, -0.7760009765625, -0.7453384399414062, -0.7146759033203125, -0.6840133666992188, -0.653350830078125, -0.6226882934570312, -0.5920257568359375, -0.5613632202148438, -0.53070068359375, -0.5000381469726562, -0.4693756103515625, -0.43871307373046875, -0.408050537109375, -0.37738800048828125, -0.3467254638671875, -0.31606292724609375, -0.285400390625, -0.25473785400390625, -0.2240753173828125, -0.19341278076171875, -0.162750244140625, -0.13208770751953125, -0.1014251708984375, -0.07076263427734375, -0.04010009765625, -0.00943756103515625, 0.0212249755859375, 0.05188751220703125, 0.082550048828125, 0.11321258544921875, 0.1438751220703125, 0.17453765869140625, 0.2052001953125, 0.23586273193359375, 0.2665252685546875, 0.29718780517578125, 0.327850341796875, 0.35851287841796875, 0.3891754150390625, 0.41983795166015625, 0.45050048828125, 0.48116302490234375, 0.5118255615234375, 0.5424880981445312, 0.573150634765625, 0.6038131713867188, 0.6344757080078125, 0.6651382446289062, 0.69580078125]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 15.0, 38.0, 232.0, 465.0, 192.0, 45.0, 13.0, 4.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-66.82154846191406, -65.54659271240234, -64.2716293334961, -62.99666976928711, -61.721710205078125, -60.44675064086914, -59.171791076660156, -57.89683151245117, -56.62187194824219, -55.3469123840332, -54.07195281982422, -52.796993255615234, -51.52203369140625, -50.247074127197266, -48.97211456298828, -47.6971549987793, -46.42219543457031, -45.14723587036133, -43.872276306152344, -42.59731674194336, -41.322357177734375, -40.04739761352539, -38.772438049316406, -37.49747848510742, -36.2225227355957, -34.94756317138672, -33.672603607177734, -32.39764404296875, -31.122684478759766, -29.84772491455078, -28.572765350341797, -27.297805786132812, -26.022846221923828, -24.747886657714844, -23.47292709350586, -22.197967529296875, -20.92300796508789, -19.648048400878906, -18.373088836669922, -17.098129272460938, -15.823169708251953, -14.548210144042969, -13.273250579833984, -11.998291015625, -10.723331451416016, -9.448371887207031, -8.173413276672363, -6.898453712463379, -5.6234941482543945, -4.34853458404541, -3.073575258255005, -1.7986159324645996, -0.5236563682556152, 0.7513031959533691, 2.0262622833251953, 3.3012218475341797, 4.576181411743164, 5.851140975952148, 7.126100540161133, 8.401060104370117, 9.676019668579102, 10.950979232788086, 12.225937843322754, 13.500897407531738, 14.775856971740723]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 9.0, 7.0, 11.0, 14.0, 15.0, 21.0, 13.0, 27.0, 24.0, 24.0, 31.0, 36.0, 31.0, 40.0, 41.0, 55.0, 47.0, 41.0, 40.0, 53.0, 49.0, 45.0, 46.0, 42.0, 31.0, 33.0, 26.0, 22.0, 11.0, 13.0, 18.0, 17.0, 6.0, 8.0, 4.0, 5.0, 3.0, 8.0, 5.0, 6.0, 1.0, 5.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0], "bins": [-14.417641639709473, -13.977898597717285, -13.538155555725098, -13.098411560058594, -12.658668518066406, -12.218925476074219, -11.779182434082031, -11.339439392089844, -10.899696350097656, -10.459953308105469, -10.020210266113281, -9.580467224121094, -9.14072322845459, -8.700980186462402, -8.261237144470215, -7.821494102478027, -7.381750106811523, -6.942007064819336, -6.50226354598999, -6.062520503997803, -5.622776985168457, -5.1830339431762695, -4.743290901184082, -4.3035478591918945, -3.863804340362549, -3.4240610599517822, -2.9843177795410156, -2.544574737548828, -2.1048314571380615, -1.665088176727295, -1.2253451347351074, -0.7856018543243408, -0.3458595275878906, 0.0938836932182312, 0.533626914024353, 0.9733700752258301, 1.4131133556365967, 1.8528566360473633, 2.292599678039551, 2.7323429584503174, 3.172086238861084, 3.6118295192718506, 4.051572799682617, 4.491315841674805, 4.931058883666992, 5.370802402496338, 5.810545444488525, 6.250288963317871, 6.690032005310059, 7.129775047302246, 7.569518566131592, 8.009262084960938, 8.449005126953125, 8.888748168945312, 9.3284912109375, 9.768234252929688, 10.207977294921875, 10.647720336914062, 11.08746337890625, 11.527206420898438, 11.966950416564941, 12.406693458557129, 12.846436500549316, 13.286179542541504, 13.725923538208008]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 9.0, 9.0, 11.0, 21.0, 41.0, 86.0, 165.0, 413.0, 1401.0, 7140.0, 126198.0, 4013744.0, 39788.0, 3809.0, 881.0, 299.0, 117.0, 58.0, 33.0, 14.0, 18.0, 8.0, 9.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.798828125, -2.706573486328125, -2.61431884765625, -2.522064208984375, -2.4298095703125, -2.337554931640625, -2.24530029296875, -2.153045654296875, -2.060791015625, -1.968536376953125, -1.87628173828125, -1.784027099609375, -1.6917724609375, -1.599517822265625, -1.50726318359375, -1.415008544921875, -1.32275390625, -1.230499267578125, -1.13824462890625, -1.045989990234375, -0.9537353515625, -0.861480712890625, -0.76922607421875, -0.676971435546875, -0.584716796875, -0.492462158203125, -0.40020751953125, -0.307952880859375, -0.2156982421875, -0.123443603515625, -0.03118896484375, 0.061065673828125, 0.1533203125, 0.245574951171875, 0.33782958984375, 0.430084228515625, 0.5223388671875, 0.614593505859375, 0.70684814453125, 0.799102783203125, 0.891357421875, 0.983612060546875, 1.07586669921875, 1.168121337890625, 1.2603759765625, 1.352630615234375, 1.44488525390625, 1.537139892578125, 1.62939453125, 1.721649169921875, 1.81390380859375, 1.906158447265625, 1.9984130859375, 2.090667724609375, 2.18292236328125, 2.275177001953125, 2.367431640625, 2.459686279296875, 2.55194091796875, 2.644195556640625, 2.7364501953125, 2.828704833984375, 2.92095947265625, 3.013214111328125, 3.10546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 11.0, 16.0, 26.0, 35.0, 27.0, 43.0, 58.0, 64.0, 57.0, 66.0, 55.0, 83.0, 62.0, 65.0, 53.0, 73.0, 41.0, 29.0, 26.0, 23.0, 17.0, 17.0, 14.0, 10.0, 7.0, 3.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.892578125, -0.8558502197265625, -0.819122314453125, -0.7823944091796875, -0.74566650390625, -0.7089385986328125, -0.672210693359375, -0.6354827880859375, -0.5987548828125, -0.5620269775390625, -0.525299072265625, -0.4885711669921875, -0.45184326171875, -0.4151153564453125, -0.378387451171875, -0.3416595458984375, -0.304931640625, -0.2682037353515625, -0.231475830078125, -0.1947479248046875, -0.15802001953125, -0.1212921142578125, -0.084564208984375, -0.0478363037109375, -0.0111083984375, 0.0256195068359375, 0.062347412109375, 0.0990753173828125, 0.13580322265625, 0.1725311279296875, 0.209259033203125, 0.2459869384765625, 0.28271484375, 0.3194427490234375, 0.356170654296875, 0.3928985595703125, 0.42962646484375, 0.4663543701171875, 0.503082275390625, 0.5398101806640625, 0.5765380859375, 0.6132659912109375, 0.649993896484375, 0.6867218017578125, 0.72344970703125, 0.7601776123046875, 0.796905517578125, 0.8336334228515625, 0.870361328125, 0.9070892333984375, 0.943817138671875, 0.9805450439453125, 1.01727294921875, 1.0540008544921875, 1.090728759765625, 1.1274566650390625, 1.1641845703125, 1.2009124755859375, 1.237640380859375, 1.2743682861328125, 1.31109619140625, 1.3478240966796875, 1.384552001953125, 1.4212799072265625, 1.4580078125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 4.0, 5.0, 10.0, 17.0, 11.0, 27.0, 27.0, 42.0, 61.0, 71.0, 66.0, 129.0, 142.0, 250.0, 399.0, 923.0, 2383.0, 8295.0, 47940.0, 1279211.0, 2785237.0, 55080.0, 9399.0, 2470.0, 866.0, 425.0, 228.0, 135.0, 103.0, 68.0, 64.0, 45.0, 28.0, 35.0, 26.0, 19.0, 8.0, 6.0, 8.0, 9.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-1.681640625, -1.63623046875, -1.5908203125, -1.54541015625, -1.5, -1.45458984375, -1.4091796875, -1.36376953125, -1.318359375, -1.27294921875, -1.2275390625, -1.18212890625, -1.13671875, -1.09130859375, -1.0458984375, -1.00048828125, -0.955078125, -0.90966796875, -0.8642578125, -0.81884765625, -0.7734375, -0.72802734375, -0.6826171875, -0.63720703125, -0.591796875, -0.54638671875, -0.5009765625, -0.45556640625, -0.41015625, -0.36474609375, -0.3193359375, -0.27392578125, -0.228515625, -0.18310546875, -0.1376953125, -0.09228515625, -0.046875, -0.00146484375, 0.0439453125, 0.08935546875, 0.134765625, 0.18017578125, 0.2255859375, 0.27099609375, 0.31640625, 0.36181640625, 0.4072265625, 0.45263671875, 0.498046875, 0.54345703125, 0.5888671875, 0.63427734375, 0.6796875, 0.72509765625, 0.7705078125, 0.81591796875, 0.861328125, 0.90673828125, 0.9521484375, 0.99755859375, 1.04296875, 1.08837890625, 1.1337890625, 1.17919921875, 1.224609375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 11.0, 21.0, 47.0, 116.0, 392.0, 2616.0, 599.0, 145.0, 59.0, 28.0, 20.0, 10.0, 7.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.60546875, -1.57177734375, -1.5380859375, -1.50439453125, -1.470703125, -1.43701171875, -1.4033203125, -1.36962890625, -1.3359375, -1.30224609375, -1.2685546875, -1.23486328125, -1.201171875, -1.16748046875, -1.1337890625, -1.10009765625, -1.06640625, -1.03271484375, -0.9990234375, -0.96533203125, -0.931640625, -0.89794921875, -0.8642578125, -0.83056640625, -0.796875, -0.76318359375, -0.7294921875, -0.69580078125, -0.662109375, -0.62841796875, -0.5947265625, -0.56103515625, -0.52734375, -0.49365234375, -0.4599609375, -0.42626953125, -0.392578125, -0.35888671875, -0.3251953125, -0.29150390625, -0.2578125, -0.22412109375, -0.1904296875, -0.15673828125, -0.123046875, -0.08935546875, -0.0556640625, -0.02197265625, 0.01171875, 0.04541015625, 0.0791015625, 0.11279296875, 0.146484375, 0.18017578125, 0.2138671875, 0.24755859375, 0.28125, 0.31494140625, 0.3486328125, 0.38232421875, 0.416015625, 0.44970703125, 0.4833984375, 0.51708984375, 0.55078125]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 5.0, 1.0, 10.0, 30.0, 43.0, 120.0, 220.0, 237.0, 203.0, 85.0, 29.0, 13.0, 6.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.602649211883545, -7.438710689544678, -7.2747721672058105, -7.110833168029785, -6.946894645690918, -6.782956123352051, -6.619017601013184, -6.455079078674316, -6.291140556335449, -6.127202033996582, -5.963263511657715, -5.7993245124816895, -5.635385990142822, -5.471447467803955, -5.307508945465088, -5.143570423126221, -4.979631423950195, -4.815692901611328, -4.651754379272461, -4.4878153800964355, -4.323876857757568, -4.159938335418701, -3.995999813079834, -3.832061290740967, -3.6681225299835205, -3.5041840076446533, -3.340245246887207, -3.17630672454834, -3.0123682022094727, -2.8484294414520264, -2.684490919113159, -2.520552158355713, -2.356614112854004, -2.1926755905151367, -2.0287368297576904, -1.8647983074188232, -1.7008596658706665, -1.5369210243225098, -1.3729825019836426, -1.2090438604354858, -1.045105218887329, -0.8811665773391724, -0.7172279953956604, -0.5532894134521484, -0.3893507719039917, -0.22541213035583496, -0.061473548412323, 0.10246503353118896, 0.2664036750793457, 0.43034228682518005, 0.5942808985710144, 0.7582194805145264, 0.9221581220626831, 1.0860967636108398, 1.250035285949707, 1.4139739274978638, 1.5779125690460205, 1.7418512105941772, 1.905789852142334, 2.069728374481201, 2.2336668968200684, 2.3976056575775146, 2.561544179916382, 2.725482940673828, 2.8894214630126953]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 6.0, 9.0, 19.0, 21.0, 18.0, 26.0, 19.0, 30.0, 35.0, 45.0, 62.0, 52.0, 44.0, 53.0, 54.0, 60.0, 62.0, 47.0, 50.0, 61.0, 45.0, 43.0, 30.0, 21.0, 27.0, 9.0, 9.0, 15.0, 10.0, 9.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3559722900390625, -2.2811644077301025, -2.2063565254211426, -2.1315486431121826, -2.0567407608032227, -1.9819329977035522, -1.9071252346038818, -1.8323173522949219, -1.757509469985962, -1.682701587677002, -1.607893705368042, -1.5330859422683716, -1.4582780599594116, -1.3834701776504517, -1.3086624145507812, -1.2338545322418213, -1.1590466499328613, -1.0842387676239014, -1.0094308853149414, -0.934623122215271, -0.859815239906311, -0.7850073575973511, -0.7101995348930359, -0.6353917121887207, -0.5605838298797607, -0.48577597737312317, -0.4109681248664856, -0.336160272359848, -0.26135241985321045, -0.18654456734657288, -0.1117367148399353, -0.03692889213562012, 0.037878990173339844, 0.11268684267997742, 0.187494695186615, 0.26230254769325256, 0.33711040019989014, 0.4119182527065277, 0.4867261052131653, 0.5615339279174805, 0.6363418102264404, 0.7111496925354004, 0.7859575152397156, 0.8607653379440308, 0.9355732202529907, 1.0103811025619507, 1.085188865661621, 1.159996747970581, 1.234804630279541, 1.309612512588501, 1.384420394897461, 1.4592281579971313, 1.5340360403060913, 1.6088439226150513, 1.6836516857147217, 1.7584595680236816, 1.8332674503326416, 1.9080753326416016, 1.9828832149505615, 2.0576910972595215, 2.1324987411499023, 2.2073066234588623, 2.2821145057678223, 2.3569223880767822, 2.431730270385742]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 7.0, 4.0, 11.0, 9.0, 28.0, 58.0, 119.0, 293.0, 1075.0, 8349.0, 324090.0, 695134.0, 17166.0, 1554.0, 380.0, 131.0, 77.0, 26.0, 17.0, 9.0, 9.0, 7.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9375, -3.7974853515625, -3.657470703125, -3.5174560546875, -3.37744140625, -3.2374267578125, -3.097412109375, -2.9573974609375, -2.8173828125, -2.6773681640625, -2.537353515625, -2.3973388671875, -2.25732421875, -2.1173095703125, -1.977294921875, -1.8372802734375, -1.697265625, -1.5572509765625, -1.417236328125, -1.2772216796875, -1.13720703125, -0.9971923828125, -0.857177734375, -0.7171630859375, -0.5771484375, -0.4371337890625, -0.297119140625, -0.1571044921875, -0.01708984375, 0.1229248046875, 0.262939453125, 0.4029541015625, 0.54296875, 0.6829833984375, 0.822998046875, 0.9630126953125, 1.10302734375, 1.2430419921875, 1.383056640625, 1.5230712890625, 1.6630859375, 1.8031005859375, 1.943115234375, 2.0831298828125, 2.22314453125, 2.3631591796875, 2.503173828125, 2.6431884765625, 2.783203125, 2.9232177734375, 3.063232421875, 3.2032470703125, 3.34326171875, 3.4832763671875, 3.623291015625, 3.7633056640625, 3.9033203125, 4.0433349609375, 4.183349609375, 4.3233642578125, 4.46337890625, 4.6033935546875, 4.743408203125, 4.8834228515625, 5.0234375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 2.0, 7.0, 3.0, 7.0, 15.0, 15.0, 18.0, 35.0, 31.0, 41.0, 48.0, 64.0, 63.0, 59.0, 71.0, 67.0, 55.0, 64.0, 54.0, 62.0, 52.0, 36.0, 36.0, 24.0, 17.0, 19.0, 9.0, 10.0, 6.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80908203125, -0.7731857299804688, -0.7372894287109375, -0.7013931274414062, -0.665496826171875, -0.6296005249023438, -0.5937042236328125, -0.5578079223632812, -0.52191162109375, -0.48601531982421875, -0.4501190185546875, -0.41422271728515625, -0.378326416015625, -0.34243011474609375, -0.3065338134765625, -0.27063751220703125, -0.2347412109375, -0.19884490966796875, -0.1629486083984375, -0.12705230712890625, -0.091156005859375, -0.05525970458984375, -0.0193634033203125, 0.01653289794921875, 0.05242919921875, 0.08832550048828125, 0.1242218017578125, 0.16011810302734375, 0.196014404296875, 0.23191070556640625, 0.2678070068359375, 0.30370330810546875, 0.339599609375, 0.37549591064453125, 0.4113922119140625, 0.44728851318359375, 0.483184814453125, 0.5190811157226562, 0.5549774169921875, 0.5908737182617188, 0.62677001953125, 0.6626663208007812, 0.6985626220703125, 0.7344589233398438, 0.770355224609375, 0.8062515258789062, 0.8421478271484375, 0.8780441284179688, 0.9139404296875, 0.9498367309570312, 0.9857330322265625, 1.0216293334960938, 1.057525634765625, 1.0934219360351562, 1.1293182373046875, 1.1652145385742188, 1.20111083984375, 1.2370071411132812, 1.2729034423828125, 1.3087997436523438, 1.344696044921875, 1.3805923461914062, 1.4164886474609375, 1.4523849487304688, 1.48828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 8.0, 4.0, 10.0, 17.0, 24.0, 38.0, 48.0, 93.0, 124.0, 240.0, 601.0, 1569.0, 7066.0, 167969.0, 837891.0, 27909.0, 3109.0, 982.0, 399.0, 181.0, 103.0, 51.0, 37.0, 24.0, 10.0, 16.0, 7.0, 9.0, 2.0, 1.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.9296875, -2.822235107421875, -2.71478271484375, -2.607330322265625, -2.4998779296875, -2.392425537109375, -2.28497314453125, -2.177520751953125, -2.070068359375, -1.962615966796875, -1.85516357421875, -1.747711181640625, -1.6402587890625, -1.532806396484375, -1.42535400390625, -1.317901611328125, -1.21044921875, -1.102996826171875, -0.99554443359375, -0.888092041015625, -0.7806396484375, -0.673187255859375, -0.56573486328125, -0.458282470703125, -0.350830078125, -0.243377685546875, -0.13592529296875, -0.028472900390625, 0.0789794921875, 0.186431884765625, 0.29388427734375, 0.401336669921875, 0.5087890625, 0.616241455078125, 0.72369384765625, 0.831146240234375, 0.9385986328125, 1.046051025390625, 1.15350341796875, 1.260955810546875, 1.368408203125, 1.475860595703125, 1.58331298828125, 1.690765380859375, 1.7982177734375, 1.905670166015625, 2.01312255859375, 2.120574951171875, 2.22802734375, 2.335479736328125, 2.44293212890625, 2.550384521484375, 2.6578369140625, 2.765289306640625, 2.87274169921875, 2.980194091796875, 3.087646484375, 3.195098876953125, 3.30255126953125, 3.410003662109375, 3.5174560546875, 3.624908447265625, 3.73236083984375, 3.839813232421875, 3.947265625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 8.0, 9.0, 12.0, 11.0, 12.0, 12.0, 28.0, 18.0, 22.0, 27.0, 31.0, 37.0, 30.0, 62.0, 53.0, 52.0, 50.0, 55.0, 46.0, 49.0, 46.0, 34.0, 41.0, 45.0, 36.0, 35.0, 24.0, 26.0, 21.0, 23.0, 9.0, 5.0, 14.0, 9.0, 5.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7890625, -2.68988037109375, -2.5906982421875, -2.49151611328125, -2.392333984375, -2.29315185546875, -2.1939697265625, -2.09478759765625, -1.99560546875, -1.89642333984375, -1.7972412109375, -1.69805908203125, -1.598876953125, -1.49969482421875, -1.4005126953125, -1.30133056640625, -1.2021484375, -1.10296630859375, -1.0037841796875, -0.90460205078125, -0.805419921875, -0.70623779296875, -0.6070556640625, -0.50787353515625, -0.40869140625, -0.30950927734375, -0.2103271484375, -0.11114501953125, -0.011962890625, 0.08721923828125, 0.1864013671875, 0.28558349609375, 0.384765625, 0.48394775390625, 0.5831298828125, 0.68231201171875, 0.781494140625, 0.88067626953125, 0.9798583984375, 1.07904052734375, 1.17822265625, 1.27740478515625, 1.3765869140625, 1.47576904296875, 1.574951171875, 1.67413330078125, 1.7733154296875, 1.87249755859375, 1.9716796875, 2.07086181640625, 2.1700439453125, 2.26922607421875, 2.368408203125, 2.46759033203125, 2.5667724609375, 2.66595458984375, 2.76513671875, 2.86431884765625, 2.9635009765625, 3.06268310546875, 3.161865234375, 3.26104736328125, 3.3602294921875, 3.45941162109375, 3.55859375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 6.0, 10.0, 13.0, 27.0, 27.0, 54.0, 84.0, 136.0, 267.0, 581.0, 1425.0, 4919.0, 28439.0, 312772.0, 630758.0, 57417.0, 7929.0, 2132.0, 775.0, 350.0, 180.0, 96.0, 60.0, 19.0, 22.0, 13.0, 10.0, 8.0, 6.0, 2.0, 4.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.67529296875, -0.6529006958007812, -0.6305084228515625, -0.6081161499023438, -0.585723876953125, -0.5633316040039062, -0.5409393310546875, -0.5185470581054688, -0.49615478515625, -0.47376251220703125, -0.4513702392578125, -0.42897796630859375, -0.406585693359375, -0.38419342041015625, -0.3618011474609375, -0.33940887451171875, -0.3170166015625, -0.29462432861328125, -0.2722320556640625, -0.24983978271484375, -0.227447509765625, -0.20505523681640625, -0.1826629638671875, -0.16027069091796875, -0.13787841796875, -0.11548614501953125, -0.0930938720703125, -0.07070159912109375, -0.048309326171875, -0.02591705322265625, -0.0035247802734375, 0.01886749267578125, 0.041259765625, 0.06365203857421875, 0.0860443115234375, 0.10843658447265625, 0.130828857421875, 0.15322113037109375, 0.1756134033203125, 0.19800567626953125, 0.22039794921875, 0.24279022216796875, 0.2651824951171875, 0.28757476806640625, 0.309967041015625, 0.33235931396484375, 0.3547515869140625, 0.37714385986328125, 0.3995361328125, 0.42192840576171875, 0.4443206787109375, 0.46671295166015625, 0.489105224609375, 0.5114974975585938, 0.5338897705078125, 0.5562820434570312, 0.57867431640625, 0.6010665893554688, 0.6234588623046875, 0.6458511352539062, 0.668243408203125, 0.6906356811523438, 0.7130279541015625, 0.7354202270507812, 0.7578125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 8.0, 7.0, 8.0, 14.0, 17.0, 18.0, 22.0, 18.0, 36.0, 47.0, 57.0, 57.0, 110.0, 114.0, 116.0, 76.0, 64.0, 29.0, 38.0, 25.0, 24.0, 26.0, 13.0, 15.0, 9.0, 6.0, 4.0, 6.0, 6.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00015997886657714844, -0.00015585403889417648, -0.00015172921121120453, -0.00014760438352823257, -0.00014347955584526062, -0.00013935472816228867, -0.0001352299004793167, -0.00013110507279634476, -0.0001269802451133728, -0.00012285541743040085, -0.0001187305897474289, -0.00011460576206445694, -0.00011048093438148499, -0.00010635610669851303, -0.00010223127901554108, -9.810645133256912e-05, -9.398162364959717e-05, -8.985679596662521e-05, -8.573196828365326e-05, -8.16071406006813e-05, -7.748231291770935e-05, -7.33574852347374e-05, -6.923265755176544e-05, -6.510782986879349e-05, -6.098300218582153e-05, -5.685817450284958e-05, -5.2733346819877625e-05, -4.860851913690567e-05, -4.4483691453933716e-05, -4.035886377096176e-05, -3.623403608798981e-05, -3.210920840501785e-05, -2.79843807220459e-05, -2.3859553039073944e-05, -1.973472535610199e-05, -1.5609897673130035e-05, -1.1485069990158081e-05, -7.360242307186127e-06, -3.2354146242141724e-06, 8.89413058757782e-07, 5.014240741729736e-06, 9.13906842470169e-06, 1.3263896107673645e-05, 1.73887237906456e-05, 2.1513551473617554e-05, 2.5638379156589508e-05, 2.9763206839561462e-05, 3.388803452253342e-05, 3.801286220550537e-05, 4.2137689888477325e-05, 4.626251757144928e-05, 5.0387345254421234e-05, 5.451217293739319e-05, 5.863700062036514e-05, 6.27618283033371e-05, 6.688665598630905e-05, 7.1011483669281e-05, 7.513631135225296e-05, 7.926113903522491e-05, 8.338596671819687e-05, 8.751079440116882e-05, 9.163562208414078e-05, 9.576044976711273e-05, 9.988527745008469e-05, 0.00010401010513305664]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 7.0, 10.0, 14.0, 25.0, 39.0, 65.0, 149.0, 290.0, 757.0, 2312.0, 12904.0, 247099.0, 741111.0, 37630.0, 4114.0, 1156.0, 448.0, 198.0, 97.0, 56.0, 38.0, 20.0, 8.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6953125, -0.66400146484375, -0.6326904296875, -0.60137939453125, -0.570068359375, -0.53875732421875, -0.5074462890625, -0.47613525390625, -0.44482421875, -0.41351318359375, -0.3822021484375, -0.35089111328125, -0.319580078125, -0.28826904296875, -0.2569580078125, -0.22564697265625, -0.1943359375, -0.16302490234375, -0.1317138671875, -0.10040283203125, -0.069091796875, -0.03778076171875, -0.0064697265625, 0.02484130859375, 0.05615234375, 0.08746337890625, 0.1187744140625, 0.15008544921875, 0.181396484375, 0.21270751953125, 0.2440185546875, 0.27532958984375, 0.306640625, 0.33795166015625, 0.3692626953125, 0.40057373046875, 0.431884765625, 0.46319580078125, 0.4945068359375, 0.52581787109375, 0.55712890625, 0.58843994140625, 0.6197509765625, 0.65106201171875, 0.682373046875, 0.71368408203125, 0.7449951171875, 0.77630615234375, 0.8076171875, 0.83892822265625, 0.8702392578125, 0.90155029296875, 0.932861328125, 0.96417236328125, 0.9954833984375, 1.02679443359375, 1.05810546875, 1.08941650390625, 1.1207275390625, 1.15203857421875, 1.183349609375, 1.21466064453125, 1.2459716796875, 1.27728271484375, 1.30859375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 7.0, 15.0, 29.0, 34.0, 65.0, 71.0, 91.0, 120.0, 141.0, 113.0, 89.0, 81.0, 52.0, 39.0, 26.0, 10.0, 7.0, 3.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2548828125, -1.22479248046875, -1.1947021484375, -1.16461181640625, -1.134521484375, -1.10443115234375, -1.0743408203125, -1.04425048828125, -1.01416015625, -0.98406982421875, -0.9539794921875, -0.92388916015625, -0.893798828125, -0.86370849609375, -0.8336181640625, -0.80352783203125, -0.7734375, -0.74334716796875, -0.7132568359375, -0.68316650390625, -0.653076171875, -0.62298583984375, -0.5928955078125, -0.56280517578125, -0.53271484375, -0.50262451171875, -0.4725341796875, -0.44244384765625, -0.412353515625, -0.38226318359375, -0.3521728515625, -0.32208251953125, -0.2919921875, -0.26190185546875, -0.2318115234375, -0.20172119140625, -0.171630859375, -0.14154052734375, -0.1114501953125, -0.08135986328125, -0.05126953125, -0.02117919921875, 0.0089111328125, 0.03900146484375, 0.069091796875, 0.09918212890625, 0.1292724609375, 0.15936279296875, 0.189453125, 0.21954345703125, 0.2496337890625, 0.27972412109375, 0.309814453125, 0.33990478515625, 0.3699951171875, 0.40008544921875, 0.43017578125, 0.46026611328125, 0.4903564453125, 0.52044677734375, 0.550537109375, 0.58062744140625, 0.6107177734375, 0.64080810546875, 0.6708984375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 10.0, 41.0, 154.0, 384.0, 299.0, 89.0, 23.0, 4.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.26220703125, -22.197486877441406, -21.13276481628418, -20.068044662475586, -19.00332260131836, -17.938602447509766, -16.873882293701172, -15.809160232543945, -14.744439125061035, -13.679718017578125, -12.614996910095215, -11.550275802612305, -10.485555648803711, -9.420833587646484, -8.35611343383789, -7.2913923263549805, -6.22667121887207, -5.16195011138916, -4.09722900390625, -3.032508373260498, -1.967787265777588, -0.9030661582946777, 0.16165447235107422, 1.2263755798339844, 2.2910966873168945, 3.3558177947998047, 4.420538902282715, 5.485259532928467, 6.549980640411377, 7.614701747894287, 8.679422378540039, 9.74414348602295, 10.80886459350586, 11.87358570098877, 12.93830680847168, 14.003026962280273, 15.0677490234375, 16.132469177246094, 17.197189331054688, 18.261911392211914, 19.32663345336914, 20.391353607177734, 21.45607566833496, 22.520795822143555, 23.58551788330078, 24.650238037109375, 25.71495819091797, 26.779680252075195, 27.84440040588379, 28.909120559692383, 29.97384262084961, 31.038562774658203, 32.1032829284668, 33.168006896972656, 34.23272705078125, 35.297447204589844, 36.36216735839844, 37.42688751220703, 38.491607666015625, 39.556331634521484, 40.62105178833008, 41.68577194213867, 42.750492095947266, 43.815216064453125, 44.87993621826172]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 1.0, 3.0, 12.0, 8.0, 14.0, 16.0, 9.0, 10.0, 26.0, 27.0, 27.0, 36.0, 34.0, 42.0, 48.0, 56.0, 62.0, 56.0, 55.0, 57.0, 54.0, 39.0, 44.0, 36.0, 39.0, 33.0, 20.0, 33.0, 21.0, 15.0, 15.0, 10.0, 15.0, 5.0, 9.0, 2.0, 2.0, 6.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 3.0], "bins": [-16.691482543945312, -16.243114471435547, -15.794747352600098, -15.346379280090332, -14.898012161254883, -14.449644088745117, -14.001276016235352, -13.552907943725586, -13.104540824890137, -12.656172752380371, -12.207805633544922, -11.759437561035156, -11.31106948852539, -10.862702369689941, -10.414334297180176, -9.965967178344727, -9.517599105834961, -9.069231033325195, -8.620863914489746, -8.17249584197998, -7.724128246307373, -7.275760650634766, -6.827392578125, -6.379024982452393, -5.930657386779785, -5.482289791107178, -5.03392219543457, -4.585554122924805, -4.137186527252197, -3.68881893157959, -3.2404510974884033, -2.792083263397217, -2.343714714050293, -1.895346999168396, -1.446979284286499, -0.998611569404602, -0.5502438545227051, -0.10187625885009766, 0.34649157524108887, 0.7948594093322754, 1.2432270050048828, 1.6915947198867798, 2.1399624347686768, 2.5883302688598633, 3.0366978645324707, 3.485065460205078, 3.9334332942962646, 4.381801128387451, 4.830168724060059, 5.278536319732666, 5.726903915405273, 6.175271987915039, 6.6236395835876465, 7.072007179260254, 7.5203752517700195, 7.968742847442627, 8.417110443115234, 8.865478515625, 9.31384563446045, 9.762213706970215, 10.210580825805664, 10.65894889831543, 11.107316970825195, 11.555685043334961, 12.00405216217041]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 6.0, 3.0, 8.0, 6.0, 8.0, 10.0, 18.0, 15.0, 29.0, 31.0, 41.0, 66.0, 135.0, 258.0, 769.0, 4322.0, 77141.0, 4003911.0, 100592.0, 5126.0, 978.0, 362.0, 159.0, 84.0, 54.0, 37.0, 27.0, 28.0, 16.0, 20.0, 8.0, 6.0, 6.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.0755615234375, -1.990966796875, -1.9063720703125, -1.82177734375, -1.7371826171875, -1.652587890625, -1.5679931640625, -1.4833984375, -1.3988037109375, -1.314208984375, -1.2296142578125, -1.14501953125, -1.0604248046875, -0.975830078125, -0.8912353515625, -0.806640625, -0.7220458984375, -0.637451171875, -0.5528564453125, -0.46826171875, -0.3836669921875, -0.299072265625, -0.2144775390625, -0.1298828125, -0.0452880859375, 0.039306640625, 0.1239013671875, 0.20849609375, 0.2930908203125, 0.377685546875, 0.4622802734375, 0.546875, 0.6314697265625, 0.716064453125, 0.8006591796875, 0.88525390625, 0.9698486328125, 1.054443359375, 1.1390380859375, 1.2236328125, 1.3082275390625, 1.392822265625, 1.4774169921875, 1.56201171875, 1.6466064453125, 1.731201171875, 1.8157958984375, 1.900390625, 1.9849853515625, 2.069580078125, 2.1541748046875, 2.23876953125, 2.3233642578125, 2.407958984375, 2.4925537109375, 2.5771484375, 2.6617431640625, 2.746337890625, 2.8309326171875, 2.91552734375, 3.0001220703125, 3.084716796875, 3.1693115234375, 3.25390625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 9.0, 10.0, 14.0, 17.0, 32.0, 25.0, 36.0, 49.0, 54.0, 75.0, 73.0, 75.0, 73.0, 73.0, 60.0, 55.0, 68.0, 57.0, 38.0, 27.0, 26.0, 14.0, 16.0, 11.0, 5.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80908203125, -0.7746658325195312, -0.7402496337890625, -0.7058334350585938, -0.671417236328125, -0.6370010375976562, -0.6025848388671875, -0.5681686401367188, -0.53375244140625, -0.49933624267578125, -0.4649200439453125, -0.43050384521484375, -0.396087646484375, -0.36167144775390625, -0.3272552490234375, -0.29283905029296875, -0.2584228515625, -0.22400665283203125, -0.1895904541015625, -0.15517425537109375, -0.120758056640625, -0.08634185791015625, -0.0519256591796875, -0.01750946044921875, 0.01690673828125, 0.05132293701171875, 0.0857391357421875, 0.12015533447265625, 0.154571533203125, 0.18898773193359375, 0.2234039306640625, 0.25782012939453125, 0.292236328125, 0.32665252685546875, 0.3610687255859375, 0.39548492431640625, 0.429901123046875, 0.46431732177734375, 0.4987335205078125, 0.5331497192382812, 0.56756591796875, 0.6019821166992188, 0.6363983154296875, 0.6708145141601562, 0.705230712890625, 0.7396469116210938, 0.7740631103515625, 0.8084793090820312, 0.8428955078125, 0.8773117065429688, 0.9117279052734375, 0.9461441040039062, 0.980560302734375, 1.0149765014648438, 1.0493927001953125, 1.0838088989257812, 1.11822509765625, 1.1526412963867188, 1.1870574951171875, 1.2214736938476562, 1.255889892578125, 1.2903060913085938, 1.3247222900390625, 1.3591384887695312, 1.3935546875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 3.0, 12.0, 17.0, 13.0, 21.0, 44.0, 50.0, 226.0, 1139.0, 12645.0, 2168330.0, 1997741.0, 12563.0, 1102.0, 195.0, 74.0, 39.0, 20.0, 18.0, 3.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.98046875, -2.89013671875, -2.7998046875, -2.70947265625, -2.619140625, -2.52880859375, -2.4384765625, -2.34814453125, -2.2578125, -2.16748046875, -2.0771484375, -1.98681640625, -1.896484375, -1.80615234375, -1.7158203125, -1.62548828125, -1.53515625, -1.44482421875, -1.3544921875, -1.26416015625, -1.173828125, -1.08349609375, -0.9931640625, -0.90283203125, -0.8125, -0.72216796875, -0.6318359375, -0.54150390625, -0.451171875, -0.36083984375, -0.2705078125, -0.18017578125, -0.08984375, 0.00048828125, 0.0908203125, 0.18115234375, 0.271484375, 0.36181640625, 0.4521484375, 0.54248046875, 0.6328125, 0.72314453125, 0.8134765625, 0.90380859375, 0.994140625, 1.08447265625, 1.1748046875, 1.26513671875, 1.35546875, 1.44580078125, 1.5361328125, 1.62646484375, 1.716796875, 1.80712890625, 1.8974609375, 1.98779296875, 2.078125, 2.16845703125, 2.2587890625, 2.34912109375, 2.439453125, 2.52978515625, 2.6201171875, 2.71044921875, 2.80078125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 6.0, 1.0, 5.0, 4.0, 19.0, 11.0, 11.0, 10.0, 19.0, 30.0, 59.0, 137.0, 251.0, 533.0, 911.0, 924.0, 545.0, 258.0, 125.0, 71.0, 33.0, 29.0, 19.0, 13.0, 8.0, 11.0, 10.0, 4.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.4658203125, -1.418548583984375, -1.37127685546875, -1.324005126953125, -1.2767333984375, -1.229461669921875, -1.18218994140625, -1.134918212890625, -1.087646484375, -1.040374755859375, -0.99310302734375, -0.945831298828125, -0.8985595703125, -0.851287841796875, -0.80401611328125, -0.756744384765625, -0.70947265625, -0.662200927734375, -0.61492919921875, -0.567657470703125, -0.5203857421875, -0.473114013671875, -0.42584228515625, -0.378570556640625, -0.331298828125, -0.284027099609375, -0.23675537109375, -0.189483642578125, -0.1422119140625, -0.094940185546875, -0.04766845703125, -0.000396728515625, 0.046875, 0.094146728515625, 0.14141845703125, 0.188690185546875, 0.2359619140625, 0.283233642578125, 0.33050537109375, 0.377777099609375, 0.425048828125, 0.472320556640625, 0.51959228515625, 0.566864013671875, 0.6141357421875, 0.661407470703125, 0.70867919921875, 0.755950927734375, 0.80322265625, 0.850494384765625, 0.89776611328125, 0.945037841796875, 0.9923095703125, 1.039581298828125, 1.08685302734375, 1.134124755859375, 1.181396484375, 1.228668212890625, 1.27593994140625, 1.323211669921875, 1.3704833984375, 1.417755126953125, 1.46502685546875, 1.512298583984375, 1.5595703125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 5.0, 7.0, 8.0, 19.0, 48.0, 85.0, 122.0, 167.0, 175.0, 126.0, 101.0, 49.0, 35.0, 18.0, 11.0, 4.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.272506237030029, -4.970510005950928, -4.668514251708984, -4.366518020629883, -4.064521789550781, -3.762526035308838, -3.4605298042297363, -3.158533811569214, -2.8565378189086914, -2.554541826248169, -2.2525458335876465, -1.950549602508545, -1.6485536098480225, -1.3465576171875, -1.044561505317688, -0.742565393447876, -0.4405694007873535, -0.13857334852218628, 0.16342270374298096, 0.4654187560081482, 0.7674148082733154, 1.069410800933838, 1.37140691280365, 1.673403024673462, 1.9753990173339844, 2.277395009994507, 2.5793910026550293, 2.881387233734131, 3.1833832263946533, 3.485379219055176, 3.7873754501342773, 4.089371681213379, 4.391366958618164, 4.693363189697266, 4.995358943939209, 5.2973551750183105, 5.599350929260254, 5.9013471603393555, 6.203343391418457, 6.505339622497559, 6.807335376739502, 7.1093316078186035, 7.411327362060547, 7.713323593139648, 8.01531982421875, 8.317316055297852, 8.619311332702637, 8.921307563781738, 9.22330379486084, 9.525300025939941, 9.827296257019043, 10.129291534423828, 10.43128776550293, 10.733283996582031, 11.035280227661133, 11.337276458740234, 11.639272689819336, 11.941268920898438, 12.243265151977539, 12.545260429382324, 12.847256660461426, 13.149252891540527, 13.451249122619629, 13.75324535369873, 14.055240631103516]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 6.0, 3.0, 8.0, 6.0, 10.0, 4.0, 7.0, 20.0, 17.0, 12.0, 17.0, 25.0, 29.0, 26.0, 28.0, 32.0, 43.0, 37.0, 42.0, 33.0, 38.0, 42.0, 34.0, 50.0, 37.0, 33.0, 41.0, 34.0, 33.0, 31.0, 31.0, 20.0, 24.0, 21.0, 21.0, 18.0, 11.0, 12.0, 18.0, 7.0, 6.0, 10.0, 7.0, 5.0, 1.0, 3.0, 5.0, 2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.2321929931640625, -4.081872463226318, -3.931551933288574, -3.78123140335083, -3.630910873413086, -3.480590343475342, -3.3302698135375977, -3.1799492835998535, -3.0296287536621094, -2.8793082237243652, -2.728987693786621, -2.578667163848877, -2.428346633911133, -2.2780261039733887, -2.1277055740356445, -1.9773850440979004, -1.8270645141601562, -1.676743984222412, -1.526423454284668, -1.3761029243469238, -1.2257823944091797, -1.0754618644714355, -0.9251413345336914, -0.7748208045959473, -0.6245002746582031, -0.474179744720459, -0.32385921478271484, -0.1735386848449707, -0.023218154907226562, 0.12710237503051758, 0.2774229049682617, 0.42774343490600586, 0.5780644416809082, 0.7283849716186523, 0.8787055015563965, 1.0290260314941406, 1.1793465614318848, 1.329667091369629, 1.479987621307373, 1.6303081512451172, 1.7806286811828613, 1.9309492111206055, 2.0812697410583496, 2.2315902709960938, 2.381910800933838, 2.532231330871582, 2.682551860809326, 2.8328723907470703, 2.9831929206848145, 3.1335134506225586, 3.2838339805603027, 3.434154510498047, 3.584475040435791, 3.734795570373535, 3.8851161003112793, 4.035436630249023, 4.185757160186768, 4.336077690124512, 4.486398220062256, 4.63671875, 4.787039279937744, 4.937359809875488, 5.087680339813232, 5.238000869750977, 5.388321399688721]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 12.0, 16.0, 17.0, 23.0, 32.0, 47.0, 80.0, 115.0, 200.0, 293.0, 489.0, 929.0, 1690.0, 3221.0, 6746.0, 14507.0, 34122.0, 84776.0, 216753.0, 362937.0, 191897.0, 73886.0, 30270.0, 12967.0, 5904.0, 2968.0, 1500.0, 840.0, 482.0, 268.0, 203.0, 113.0, 73.0, 50.0, 34.0, 22.0, 15.0, 12.0, 11.0, 6.0, 6.0, 7.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.82177734375, -0.7956314086914062, -0.7694854736328125, -0.7433395385742188, -0.717193603515625, -0.6910476684570312, -0.6649017333984375, -0.6387557983398438, -0.61260986328125, -0.5864639282226562, -0.5603179931640625, -0.5341720581054688, -0.508026123046875, -0.48188018798828125, -0.4557342529296875, -0.42958831787109375, -0.4034423828125, -0.37729644775390625, -0.3511505126953125, -0.32500457763671875, -0.298858642578125, -0.27271270751953125, -0.2465667724609375, -0.22042083740234375, -0.19427490234375, -0.16812896728515625, -0.1419830322265625, -0.11583709716796875, -0.089691162109375, -0.06354522705078125, -0.0373992919921875, -0.01125335693359375, 0.014892578125, 0.04103851318359375, 0.0671844482421875, 0.09333038330078125, 0.119476318359375, 0.14562225341796875, 0.1717681884765625, 0.19791412353515625, 0.22406005859375, 0.25020599365234375, 0.2763519287109375, 0.30249786376953125, 0.328643798828125, 0.35478973388671875, 0.3809356689453125, 0.40708160400390625, 0.4332275390625, 0.45937347412109375, 0.4855194091796875, 0.5116653442382812, 0.537811279296875, 0.5639572143554688, 0.5901031494140625, 0.6162490844726562, 0.64239501953125, 0.6685409545898438, 0.6946868896484375, 0.7208328247070312, 0.746978759765625, 0.7731246948242188, 0.7992706298828125, 0.8254165649414062, 0.8515625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 4.0, 10.0, 17.0, 21.0, 29.0, 31.0, 32.0, 64.0, 50.0, 61.0, 70.0, 78.0, 85.0, 58.0, 75.0, 62.0, 61.0, 57.0, 35.0, 25.0, 24.0, 17.0, 10.0, 5.0, 7.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81689453125, -0.7819290161132812, -0.7469635009765625, -0.7119979858398438, -0.677032470703125, -0.6420669555664062, -0.6071014404296875, -0.5721359252929688, -0.53717041015625, -0.5022048950195312, -0.4672393798828125, -0.43227386474609375, -0.397308349609375, -0.36234283447265625, -0.3273773193359375, -0.29241180419921875, -0.2574462890625, -0.22248077392578125, -0.1875152587890625, -0.15254974365234375, -0.117584228515625, -0.08261871337890625, -0.0476531982421875, -0.01268768310546875, 0.02227783203125, 0.05724334716796875, 0.0922088623046875, 0.12717437744140625, 0.162139892578125, 0.19710540771484375, 0.2320709228515625, 0.26703643798828125, 0.302001953125, 0.33696746826171875, 0.3719329833984375, 0.40689849853515625, 0.441864013671875, 0.47682952880859375, 0.5117950439453125, 0.5467605590820312, 0.58172607421875, 0.6166915893554688, 0.6516571044921875, 0.6866226196289062, 0.721588134765625, 0.7565536499023438, 0.7915191650390625, 0.8264846801757812, 0.8614501953125, 0.8964157104492188, 0.9313812255859375, 0.9663467407226562, 1.001312255859375, 1.0362777709960938, 1.0712432861328125, 1.1062088012695312, 1.14117431640625, 1.1761398315429688, 1.2111053466796875, 1.2460708618164062, 1.281036376953125, 1.3160018920898438, 1.3509674072265625, 1.3859329223632812, 1.4208984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 7.0, 4.0, 2.0, 4.0, 6.0, 13.0, 8.0, 10.0, 21.0, 30.0, 41.0, 69.0, 107.0, 141.0, 281.0, 434.0, 754.0, 1366.0, 3491.0, 16239.0, 205922.0, 750106.0, 57772.0, 7138.0, 2207.0, 988.0, 517.0, 325.0, 187.0, 96.0, 86.0, 57.0, 40.0, 26.0, 18.0, 15.0, 10.0, 5.0, 5.0, 2.0, 7.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9775390625, -1.916259765625, -1.85498046875, -1.793701171875, -1.732421875, -1.671142578125, -1.60986328125, -1.548583984375, -1.4873046875, -1.426025390625, -1.36474609375, -1.303466796875, -1.2421875, -1.180908203125, -1.11962890625, -1.058349609375, -0.9970703125, -0.935791015625, -0.87451171875, -0.813232421875, -0.751953125, -0.690673828125, -0.62939453125, -0.568115234375, -0.5068359375, -0.445556640625, -0.38427734375, -0.322998046875, -0.26171875, -0.200439453125, -0.13916015625, -0.077880859375, -0.0166015625, 0.044677734375, 0.10595703125, 0.167236328125, 0.228515625, 0.289794921875, 0.35107421875, 0.412353515625, 0.4736328125, 0.534912109375, 0.59619140625, 0.657470703125, 0.71875, 0.780029296875, 0.84130859375, 0.902587890625, 0.9638671875, 1.025146484375, 1.08642578125, 1.147705078125, 1.208984375, 1.270263671875, 1.33154296875, 1.392822265625, 1.4541015625, 1.515380859375, 1.57666015625, 1.637939453125, 1.69921875, 1.760498046875, 1.82177734375, 1.883056640625, 1.9443359375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 8.0, 4.0, 9.0, 9.0, 10.0, 11.0, 18.0, 15.0, 20.0, 17.0, 21.0, 16.0, 35.0, 29.0, 31.0, 42.0, 38.0, 43.0, 47.0, 46.0, 47.0, 51.0, 56.0, 39.0, 45.0, 37.0, 24.0, 34.0, 36.0, 30.0, 26.0, 13.0, 14.0, 19.0, 17.0, 10.0, 9.0, 8.0, 2.0, 6.0, 0.0, 7.0, 0.0, 0.0, 1.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-2.408203125, -2.3345947265625, -2.260986328125, -2.1873779296875, -2.11376953125, -2.0401611328125, -1.966552734375, -1.8929443359375, -1.8193359375, -1.7457275390625, -1.672119140625, -1.5985107421875, -1.52490234375, -1.4512939453125, -1.377685546875, -1.3040771484375, -1.23046875, -1.1568603515625, -1.083251953125, -1.0096435546875, -0.93603515625, -0.8624267578125, -0.788818359375, -0.7152099609375, -0.6416015625, -0.5679931640625, -0.494384765625, -0.4207763671875, -0.34716796875, -0.2735595703125, -0.199951171875, -0.1263427734375, -0.052734375, 0.0208740234375, 0.094482421875, 0.1680908203125, 0.24169921875, 0.3153076171875, 0.388916015625, 0.4625244140625, 0.5361328125, 0.6097412109375, 0.683349609375, 0.7569580078125, 0.83056640625, 0.9041748046875, 0.977783203125, 1.0513916015625, 1.125, 1.1986083984375, 1.272216796875, 1.3458251953125, 1.41943359375, 1.4930419921875, 1.566650390625, 1.6402587890625, 1.7138671875, 1.7874755859375, 1.861083984375, 1.9346923828125, 2.00830078125, 2.0819091796875, 2.155517578125, 2.2291259765625, 2.302734375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 13.0, 11.0, 17.0, 22.0, 29.0, 59.0, 76.0, 195.0, 422.0, 1079.0, 3723.0, 23661.0, 558245.0, 434105.0, 21528.0, 3484.0, 1020.0, 418.0, 181.0, 101.0, 65.0, 37.0, 12.0, 18.0, 8.0, 4.0, 5.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.94921875, -0.9185791015625, -0.887939453125, -0.8572998046875, -0.82666015625, -0.7960205078125, -0.765380859375, -0.7347412109375, -0.7041015625, -0.6734619140625, -0.642822265625, -0.6121826171875, -0.58154296875, -0.5509033203125, -0.520263671875, -0.4896240234375, -0.458984375, -0.4283447265625, -0.397705078125, -0.3670654296875, -0.33642578125, -0.3057861328125, -0.275146484375, -0.2445068359375, -0.2138671875, -0.1832275390625, -0.152587890625, -0.1219482421875, -0.09130859375, -0.0606689453125, -0.030029296875, 0.0006103515625, 0.03125, 0.0618896484375, 0.092529296875, 0.1231689453125, 0.15380859375, 0.1844482421875, 0.215087890625, 0.2457275390625, 0.2763671875, 0.3070068359375, 0.337646484375, 0.3682861328125, 0.39892578125, 0.4295654296875, 0.460205078125, 0.4908447265625, 0.521484375, 0.5521240234375, 0.582763671875, 0.6134033203125, 0.64404296875, 0.6746826171875, 0.705322265625, 0.7359619140625, 0.7666015625, 0.7972412109375, 0.827880859375, 0.8585205078125, 0.88916015625, 0.9197998046875, 0.950439453125, 0.9810791015625, 1.01171875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 9.0, 14.0, 15.0, 16.0, 11.0, 14.0, 19.0, 24.0, 14.0, 29.0, 33.0, 40.0, 49.0, 66.0, 100.0, 115.0, 92.0, 75.0, 67.0, 42.0, 28.0, 24.0, 11.0, 14.0, 14.0, 7.0, 8.0, 4.0, 8.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.0001188516616821289, -0.00011519528925418854, -0.00011153891682624817, -0.0001078825443983078, -0.00010422617197036743, -0.00010056979954242706, -9.69134271144867e-05, -9.325705468654633e-05, -8.960068225860596e-05, -8.594430983066559e-05, -8.228793740272522e-05, -7.863156497478485e-05, -7.497519254684448e-05, -7.131882011890411e-05, -6.766244769096375e-05, -6.400607526302338e-05, -6.034970283508301e-05, -5.669333040714264e-05, -5.303695797920227e-05, -4.93805855512619e-05, -4.572421312332153e-05, -4.2067840695381165e-05, -3.8411468267440796e-05, -3.475509583950043e-05, -3.109872341156006e-05, -2.744235098361969e-05, -2.378597855567932e-05, -2.0129606127738953e-05, -1.6473233699798584e-05, -1.2816861271858215e-05, -9.160488843917847e-06, -5.504116415977478e-06, -1.8477439880371094e-06, 1.8086284399032593e-06, 5.465000867843628e-06, 9.121373295783997e-06, 1.2777745723724365e-05, 1.6434118151664734e-05, 2.0090490579605103e-05, 2.374686300754547e-05, 2.740323543548584e-05, 3.105960786342621e-05, 3.471598029136658e-05, 3.8372352719306946e-05, 4.2028725147247314e-05, 4.568509757518768e-05, 4.934147000312805e-05, 5.299784243106842e-05, 5.665421485900879e-05, 6.031058728694916e-05, 6.396695971488953e-05, 6.76233321428299e-05, 7.127970457077026e-05, 7.493607699871063e-05, 7.8592449426651e-05, 8.224882185459137e-05, 8.590519428253174e-05, 8.956156671047211e-05, 9.321793913841248e-05, 9.687431156635284e-05, 0.00010053068399429321, 0.00010418705642223358, 0.00010784342885017395, 0.00011149980127811432, 0.00011515617370605469]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 10.0, 5.0, 17.0, 18.0, 18.0, 34.0, 64.0, 72.0, 116.0, 205.0, 346.0, 563.0, 1244.0, 3031.0, 10121.0, 53602.0, 646935.0, 289569.0, 31258.0, 6929.0, 2249.0, 893.0, 512.0, 294.0, 161.0, 106.0, 59.0, 36.0, 32.0, 17.0, 8.0, 11.0, 3.0, 5.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0], "bins": [-0.904296875, -0.8797607421875, -0.855224609375, -0.8306884765625, -0.80615234375, -0.7816162109375, -0.757080078125, -0.7325439453125, -0.7080078125, -0.6834716796875, -0.658935546875, -0.6343994140625, -0.60986328125, -0.5853271484375, -0.560791015625, -0.5362548828125, -0.51171875, -0.4871826171875, -0.462646484375, -0.4381103515625, -0.41357421875, -0.3890380859375, -0.364501953125, -0.3399658203125, -0.3154296875, -0.2908935546875, -0.266357421875, -0.2418212890625, -0.21728515625, -0.1927490234375, -0.168212890625, -0.1436767578125, -0.119140625, -0.0946044921875, -0.070068359375, -0.0455322265625, -0.02099609375, 0.0035400390625, 0.028076171875, 0.0526123046875, 0.0771484375, 0.1016845703125, 0.126220703125, 0.1507568359375, 0.17529296875, 0.1998291015625, 0.224365234375, 0.2489013671875, 0.2734375, 0.2979736328125, 0.322509765625, 0.3470458984375, 0.37158203125, 0.3961181640625, 0.420654296875, 0.4451904296875, 0.4697265625, 0.4942626953125, 0.518798828125, 0.5433349609375, 0.56787109375, 0.5924072265625, 0.616943359375, 0.6414794921875, 0.666015625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 6.0, 7.0, 9.0, 15.0, 12.0, 15.0, 23.0, 18.0, 30.0, 34.0, 60.0, 84.0, 101.0, 78.0, 92.0, 66.0, 81.0, 69.0, 55.0, 23.0, 28.0, 15.0, 9.0, 12.0, 11.0, 8.0, 9.0, 9.0, 3.0, 4.0, 6.0, 3.0, 3.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6015625, -0.581451416015625, -0.56134033203125, -0.541229248046875, -0.5211181640625, -0.501007080078125, -0.48089599609375, -0.460784912109375, -0.440673828125, -0.420562744140625, -0.40045166015625, -0.380340576171875, -0.3602294921875, -0.340118408203125, -0.32000732421875, -0.299896240234375, -0.27978515625, -0.259674072265625, -0.23956298828125, -0.219451904296875, -0.1993408203125, -0.179229736328125, -0.15911865234375, -0.139007568359375, -0.118896484375, -0.098785400390625, -0.07867431640625, -0.058563232421875, -0.0384521484375, -0.018341064453125, 0.00177001953125, 0.021881103515625, 0.0419921875, 0.062103271484375, 0.08221435546875, 0.102325439453125, 0.1224365234375, 0.142547607421875, 0.16265869140625, 0.182769775390625, 0.202880859375, 0.222991943359375, 0.24310302734375, 0.263214111328125, 0.2833251953125, 0.303436279296875, 0.32354736328125, 0.343658447265625, 0.36376953125, 0.383880615234375, 0.40399169921875, 0.424102783203125, 0.4442138671875, 0.464324951171875, 0.48443603515625, 0.504547119140625, 0.524658203125, 0.544769287109375, 0.56488037109375, 0.584991455078125, 0.6051025390625, 0.625213623046875, 0.64532470703125, 0.665435791015625, 0.685546875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 6.0, 13.0, 13.0, 45.0, 72.0, 144.0, 230.0, 222.0, 139.0, 56.0, 29.0, 7.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.341004371643066, -14.890397071838379, -14.439789772033691, -13.989182472229004, -13.538575172424316, -13.087967872619629, -12.637360572814941, -12.186753273010254, -11.736145973205566, -11.285538673400879, -10.834931373596191, -10.384324073791504, -9.933716773986816, -9.483109474182129, -9.032502174377441, -8.581894874572754, -8.131287574768066, -7.680680274963379, -7.230072975158691, -6.779465675354004, -6.328858375549316, -5.878251075744629, -5.427643775939941, -4.977036476135254, -4.526429176330566, -4.075821876525879, -3.6252145767211914, -3.174607276916504, -2.7239999771118164, -2.273392677307129, -1.8227853775024414, -1.372178077697754, -0.9215717315673828, -0.4709644317626953, -0.020357131958007812, 0.4302501678466797, 0.8808574676513672, 1.3314647674560547, 1.7820720672607422, 2.2326793670654297, 2.683286666870117, 3.1338939666748047, 3.584501266479492, 4.03510856628418, 4.485715866088867, 4.936323165893555, 5.386930465698242, 5.83753776550293, 6.288145065307617, 6.738752365112305, 7.189359664916992, 7.63996696472168, 8.090574264526367, 8.541181564331055, 8.991788864135742, 9.44239616394043, 9.893003463745117, 10.343610763549805, 10.794218063354492, 11.24482536315918, 11.695432662963867, 12.146039962768555, 12.596647262573242, 13.04725456237793, 13.497861862182617]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 4.0, 2.0, 5.0, 7.0, 7.0, 6.0, 9.0, 18.0, 10.0, 23.0, 17.0, 15.0, 33.0, 24.0, 16.0, 15.0, 31.0, 34.0, 34.0, 43.0, 39.0, 58.0, 43.0, 73.0, 45.0, 47.0, 36.0, 42.0, 40.0, 33.0, 35.0, 16.0, 25.0, 13.0, 22.0, 19.0, 12.0, 13.0, 5.0, 10.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.157661437988281, -8.869791030883789, -8.581920623779297, -8.294050216674805, -8.006179809570312, -7.718308925628662, -7.430438041687012, -7.1425676345825195, -6.854697227478027, -6.566826820373535, -6.278956413269043, -5.991085529327393, -5.7032151222229, -5.415344715118408, -5.127473831176758, -4.839603424072266, -4.551733016967773, -4.263862609863281, -3.97599196434021, -3.6881213188171387, -3.4002509117126465, -3.1123805046081543, -2.824509859085083, -2.5366392135620117, -2.2487688064575195, -1.9608982801437378, -1.673027753829956, -1.3851572275161743, -1.0972867012023926, -0.8094161748886108, -0.5215456485748291, -0.2336750030517578, 0.05419635772705078, 0.3420668840408325, 0.6299374103546143, 0.917807936668396, 1.2056784629821777, 1.4935489892959595, 1.7814195156097412, 2.0692901611328125, 2.3571605682373047, 2.645030975341797, 2.932901620864868, 3.2207722663879395, 3.5086426734924316, 3.796513080596924, 4.084383964538574, 4.372254371643066, 4.660124778747559, 4.947995185852051, 5.235865592956543, 5.523736476898193, 5.8116068840026855, 6.099477291107178, 6.387348175048828, 6.67521858215332, 6.9630889892578125, 7.250959396362305, 7.538829803466797, 7.826700687408447, 8.114570617675781, 8.40244197845459, 8.690312385559082, 8.978182792663574, 9.266053199768066]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 4.0, 13.0, 10.0, 11.0, 14.0, 30.0, 39.0, 42.0, 53.0, 74.0, 103.0, 164.0, 261.0, 667.0, 2589.0, 42211.0, 4078325.0, 64809.0, 3080.0, 780.0, 359.0, 197.0, 122.0, 85.0, 50.0, 41.0, 27.0, 31.0, 14.0, 21.0, 14.0, 6.0, 7.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.126953125, -3.03375244140625, -2.9405517578125, -2.84735107421875, -2.754150390625, -2.66094970703125, -2.5677490234375, -2.47454833984375, -2.38134765625, -2.28814697265625, -2.1949462890625, -2.10174560546875, -2.008544921875, -1.91534423828125, -1.8221435546875, -1.72894287109375, -1.6357421875, -1.54254150390625, -1.4493408203125, -1.35614013671875, -1.262939453125, -1.16973876953125, -1.0765380859375, -0.98333740234375, -0.89013671875, -0.79693603515625, -0.7037353515625, -0.61053466796875, -0.517333984375, -0.42413330078125, -0.3309326171875, -0.23773193359375, -0.14453125, -0.05133056640625, 0.0418701171875, 0.13507080078125, 0.228271484375, 0.32147216796875, 0.4146728515625, 0.50787353515625, 0.60107421875, 0.69427490234375, 0.7874755859375, 0.88067626953125, 0.973876953125, 1.06707763671875, 1.1602783203125, 1.25347900390625, 1.3466796875, 1.43988037109375, 1.5330810546875, 1.62628173828125, 1.719482421875, 1.81268310546875, 1.9058837890625, 1.99908447265625, 2.09228515625, 2.18548583984375, 2.2786865234375, 2.37188720703125, 2.465087890625, 2.55828857421875, 2.6514892578125, 2.74468994140625, 2.837890625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 5.0, 8.0, 12.0, 13.0, 22.0, 19.0, 33.0, 28.0, 70.0, 57.0, 60.0, 70.0, 86.0, 81.0, 61.0, 69.0, 71.0, 48.0, 40.0, 39.0, 29.0, 26.0, 20.0, 7.0, 11.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.82666015625, -0.7940444946289062, -0.7614288330078125, -0.7288131713867188, -0.696197509765625, -0.6635818481445312, -0.6309661865234375, -0.5983505249023438, -0.56573486328125, -0.5331192016601562, -0.5005035400390625, -0.46788787841796875, -0.435272216796875, -0.40265655517578125, -0.3700408935546875, -0.33742523193359375, -0.3048095703125, -0.27219390869140625, -0.2395782470703125, -0.20696258544921875, -0.174346923828125, -0.14173126220703125, -0.1091156005859375, -0.07649993896484375, -0.04388427734375, -0.01126861572265625, 0.0213470458984375, 0.05396270751953125, 0.086578369140625, 0.11919403076171875, 0.1518096923828125, 0.18442535400390625, 0.217041015625, 0.24965667724609375, 0.2822723388671875, 0.31488800048828125, 0.347503662109375, 0.38011932373046875, 0.4127349853515625, 0.44535064697265625, 0.47796630859375, 0.5105819702148438, 0.5431976318359375, 0.5758132934570312, 0.608428955078125, 0.6410446166992188, 0.6736602783203125, 0.7062759399414062, 0.7388916015625, 0.7715072631835938, 0.8041229248046875, 0.8367385864257812, 0.869354248046875, 0.9019699096679688, 0.9345855712890625, 0.9672012329101562, 0.99981689453125, 1.0324325561523438, 1.0650482177734375, 1.0976638793945312, 1.130279541015625, 1.1628952026367188, 1.1955108642578125, 1.2281265258789062, 1.2607421875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 2.0, 6.0, 2.0, 2.0, 4.0, 10.0, 19.0, 32.0, 53.0, 84.0, 143.0, 256.0, 547.0, 1027.0, 2147.0, 5595.0, 15924.0, 66020.0, 648068.0, 3007209.0, 378150.0, 48402.0, 12931.0, 4370.0, 1759.0, 777.0, 342.0, 183.0, 91.0, 47.0, 30.0, 13.0, 9.0, 7.0, 6.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.90869140625, -0.8814849853515625, -0.854278564453125, -0.8270721435546875, -0.79986572265625, -0.7726593017578125, -0.745452880859375, -0.7182464599609375, -0.6910400390625, -0.6638336181640625, -0.636627197265625, -0.6094207763671875, -0.58221435546875, -0.5550079345703125, -0.527801513671875, -0.5005950927734375, -0.473388671875, -0.4461822509765625, -0.418975830078125, -0.3917694091796875, -0.36456298828125, -0.3373565673828125, -0.310150146484375, -0.2829437255859375, -0.2557373046875, -0.2285308837890625, -0.201324462890625, -0.1741180419921875, -0.14691162109375, -0.1197052001953125, -0.092498779296875, -0.0652923583984375, -0.0380859375, -0.0108795166015625, 0.016326904296875, 0.0435333251953125, 0.07073974609375, 0.0979461669921875, 0.125152587890625, 0.1523590087890625, 0.1795654296875, 0.2067718505859375, 0.233978271484375, 0.2611846923828125, 0.28839111328125, 0.3155975341796875, 0.342803955078125, 0.3700103759765625, 0.397216796875, 0.4244232177734375, 0.451629638671875, 0.4788360595703125, 0.50604248046875, 0.5332489013671875, 0.560455322265625, 0.5876617431640625, 0.6148681640625, 0.6420745849609375, 0.669281005859375, 0.6964874267578125, 0.72369384765625, 0.7509002685546875, 0.778106689453125, 0.8053131103515625, 0.83251953125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 5.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 11.0, 22.0, 25.0, 37.0, 57.0, 126.0, 237.0, 467.0, 708.0, 915.0, 641.0, 365.0, 187.0, 100.0, 48.0, 33.0, 23.0, 9.0, 10.0, 8.0, 7.0, 4.0, 8.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.451171875, -1.4132614135742188, -1.3753509521484375, -1.3374404907226562, -1.299530029296875, -1.2616195678710938, -1.2237091064453125, -1.1857986450195312, -1.14788818359375, -1.1099777221679688, -1.0720672607421875, -1.0341567993164062, -0.996246337890625, -0.9583358764648438, -0.9204254150390625, -0.8825149536132812, -0.8446044921875, -0.8066940307617188, -0.7687835693359375, -0.7308731079101562, -0.692962646484375, -0.6550521850585938, -0.6171417236328125, -0.5792312622070312, -0.54132080078125, -0.5034103393554688, -0.4654998779296875, -0.42758941650390625, -0.389678955078125, -0.35176849365234375, -0.3138580322265625, -0.27594757080078125, -0.238037109375, -0.20012664794921875, -0.1622161865234375, -0.12430572509765625, -0.086395263671875, -0.04848480224609375, -0.0105743408203125, 0.02733612060546875, 0.06524658203125, 0.10315704345703125, 0.1410675048828125, 0.17897796630859375, 0.216888427734375, 0.25479888916015625, 0.2927093505859375, 0.33061981201171875, 0.3685302734375, 0.40644073486328125, 0.4443511962890625, 0.48226165771484375, 0.520172119140625, 0.5580825805664062, 0.5959930419921875, 0.6339035034179688, 0.67181396484375, 0.7097244262695312, 0.7476348876953125, 0.7855453491210938, 0.823455810546875, 0.8613662719726562, 0.8992767333984375, 0.9371871948242188, 0.97509765625]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 8.0, 5.0, 20.0, 70.0, 192.0, 312.0, 228.0, 100.0, 30.0, 14.0, 8.0, 4.0, 5.0, 2.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.750802993774414, -10.328902244567871, -9.907002449035645, -9.485101699829102, -9.063200950622559, -8.641300201416016, -8.219400405883789, -7.797499656677246, -7.375598907470703, -6.953698635101318, -6.531797885894775, -6.109897613525391, -5.687996864318848, -5.266096591949463, -4.844196319580078, -4.422295570373535, -4.00039529800415, -3.5784947872161865, -3.1565942764282227, -2.734694004058838, -2.312793254852295, -1.8908929824829102, -1.4689924716949463, -1.0470919609069824, -0.6251914501190186, -0.20329096913337708, 0.2186095118522644, 0.6405099630355835, 1.0624104738235474, 1.4843108654022217, 1.9062113761901855, 2.3281118869781494, 2.7500123977661133, 3.171912908554077, 3.593813419342041, 4.015713691711426, 4.437614440917969, 4.8595147132873535, 5.281414985656738, 5.703315734863281, 6.125216484069824, 6.547116756439209, 6.969017505645752, 7.390917778015137, 7.81281852722168, 8.234718322753906, 8.65661907196045, 9.078519821166992, 9.500419616699219, 9.922320365905762, 10.344220161437988, 10.766120910644531, 11.188021659851074, 11.609922409057617, 12.031822204589844, 12.453722953796387, 12.87562370300293, 13.297524452209473, 13.7194242477417, 14.141324996948242, 14.563225746154785, 14.985126495361328, 15.407026290893555, 15.828927040100098, 16.25082778930664]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 5.0, 5.0, 4.0, 9.0, 7.0, 16.0, 12.0, 15.0, 18.0, 27.0, 26.0, 25.0, 27.0, 38.0, 34.0, 31.0, 36.0, 51.0, 39.0, 36.0, 37.0, 48.0, 44.0, 41.0, 38.0, 30.0, 40.0, 34.0, 30.0, 35.0, 26.0, 15.0, 20.0, 13.0, 14.0, 11.0, 10.0, 10.0, 12.0, 11.0, 9.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.6995177268981934, -3.5844409465789795, -3.4693641662597656, -3.354287624359131, -3.239210844039917, -3.124134063720703, -3.0090572834014893, -2.8939805030822754, -2.7789039611816406, -2.6638271808624268, -2.548750400543213, -2.433673858642578, -2.3185970783233643, -2.2035202980041504, -2.0884435176849365, -1.9733667373657227, -1.8582899570465088, -1.743213176727295, -1.6281365156173706, -1.5130597352981567, -1.3979830741882324, -1.2829062938690186, -1.1678295135498047, -1.0527527332305908, -0.9376760721206665, -0.8225993514060974, -0.7075226306915283, -0.5924458503723145, -0.47736912965774536, -0.36229240894317627, -0.2472156286239624, -0.1321389079093933, -0.01706218719482422, 0.09801454842090607, 0.21309128403663635, 0.32816803455352783, 0.4432447552680969, 0.558321475982666, 0.6733982563018799, 0.788474977016449, 0.9035516977310181, 1.018628478050232, 1.1337051391601562, 1.2487819194793701, 1.363858699798584, 1.4789353609085083, 1.5940121412277222, 1.7090888023376465, 1.8241655826568604, 1.9392423629760742, 2.054319143295288, 2.169395923614502, 2.2844724655151367, 2.3995492458343506, 2.5146260261535645, 2.6297028064727783, 2.744779586791992, 2.859856367111206, 2.97493314743042, 3.0900096893310547, 3.2050864696502686, 3.3201632499694824, 3.4352400302886963, 3.55031681060791, 3.665393352508545]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 5.0, 8.0, 6.0, 14.0, 18.0, 27.0, 27.0, 52.0, 81.0, 107.0, 141.0, 244.0, 343.0, 566.0, 1025.0, 1716.0, 3193.0, 6241.0, 12806.0, 27134.0, 63513.0, 162218.0, 358599.0, 244046.0, 92637.0, 38225.0, 17397.0, 8386.0, 4161.0, 2243.0, 1335.0, 730.0, 427.0, 300.0, 175.0, 132.0, 86.0, 60.0, 37.0, 24.0, 11.0, 14.0, 17.0, 11.0, 6.0, 6.0, 5.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6904296875, -0.6671905517578125, -0.643951416015625, -0.6207122802734375, -0.59747314453125, -0.5742340087890625, -0.550994873046875, -0.5277557373046875, -0.5045166015625, -0.4812774658203125, -0.458038330078125, -0.4347991943359375, -0.41156005859375, -0.3883209228515625, -0.365081787109375, -0.3418426513671875, -0.318603515625, -0.2953643798828125, -0.272125244140625, -0.2488861083984375, -0.22564697265625, -0.2024078369140625, -0.179168701171875, -0.1559295654296875, -0.1326904296875, -0.1094512939453125, -0.086212158203125, -0.0629730224609375, -0.03973388671875, -0.0164947509765625, 0.006744384765625, 0.0299835205078125, 0.05322265625, 0.0764617919921875, 0.099700927734375, 0.1229400634765625, 0.14617919921875, 0.1694183349609375, 0.192657470703125, 0.2158966064453125, 0.2391357421875, 0.2623748779296875, 0.285614013671875, 0.3088531494140625, 0.33209228515625, 0.3553314208984375, 0.378570556640625, 0.4018096923828125, 0.425048828125, 0.4482879638671875, 0.471527099609375, 0.4947662353515625, 0.51800537109375, 0.5412445068359375, 0.564483642578125, 0.5877227783203125, 0.6109619140625, 0.6342010498046875, 0.657440185546875, 0.6806793212890625, 0.70391845703125, 0.7271575927734375, 0.750396728515625, 0.7736358642578125, 0.796875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 5.0, 11.0, 5.0, 22.0, 27.0, 24.0, 40.0, 32.0, 67.0, 67.0, 70.0, 70.0, 71.0, 72.0, 68.0, 68.0, 63.0, 46.0, 36.0, 40.0, 28.0, 20.0, 16.0, 8.0, 9.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.78369140625, -0.7509994506835938, -0.7183074951171875, -0.6856155395507812, -0.652923583984375, -0.6202316284179688, -0.5875396728515625, -0.5548477172851562, -0.52215576171875, -0.48946380615234375, -0.4567718505859375, -0.42407989501953125, -0.391387939453125, -0.35869598388671875, -0.3260040283203125, -0.29331207275390625, -0.2606201171875, -0.22792816162109375, -0.1952362060546875, -0.16254425048828125, -0.129852294921875, -0.09716033935546875, -0.0644683837890625, -0.03177642822265625, 0.00091552734375, 0.03360748291015625, 0.0662994384765625, 0.09899139404296875, 0.131683349609375, 0.16437530517578125, 0.1970672607421875, 0.22975921630859375, 0.262451171875, 0.29514312744140625, 0.3278350830078125, 0.36052703857421875, 0.393218994140625, 0.42591094970703125, 0.4586029052734375, 0.49129486083984375, 0.52398681640625, 0.5566787719726562, 0.5893707275390625, 0.6220626831054688, 0.654754638671875, 0.6874465942382812, 0.7201385498046875, 0.7528305053710938, 0.7855224609375, 0.8182144165039062, 0.8509063720703125, 0.8835983276367188, 0.916290283203125, 0.9489822387695312, 0.9816741943359375, 1.0143661499023438, 1.04705810546875, 1.0797500610351562, 1.1124420166015625, 1.1451339721679688, 1.177825927734375, 1.2105178833007812, 1.2432098388671875, 1.2759017944335938, 1.30859375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 7.0, 6.0, 6.0, 7.0, 10.0, 23.0, 30.0, 78.0, 228.0, 658.0, 3308.0, 63289.0, 937743.0, 39605.0, 2603.0, 590.0, 187.0, 81.0, 32.0, 23.0, 16.0, 7.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 7.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.466796875, -3.35992431640625, -3.2530517578125, -3.14617919921875, -3.039306640625, -2.93243408203125, -2.8255615234375, -2.71868896484375, -2.61181640625, -2.50494384765625, -2.3980712890625, -2.29119873046875, -2.184326171875, -2.07745361328125, -1.9705810546875, -1.86370849609375, -1.7568359375, -1.64996337890625, -1.5430908203125, -1.43621826171875, -1.329345703125, -1.22247314453125, -1.1156005859375, -1.00872802734375, -0.90185546875, -0.79498291015625, -0.6881103515625, -0.58123779296875, -0.474365234375, -0.36749267578125, -0.2606201171875, -0.15374755859375, -0.046875, 0.05999755859375, 0.1668701171875, 0.27374267578125, 0.380615234375, 0.48748779296875, 0.5943603515625, 0.70123291015625, 0.80810546875, 0.91497802734375, 1.0218505859375, 1.12872314453125, 1.235595703125, 1.34246826171875, 1.4493408203125, 1.55621337890625, 1.6630859375, 1.76995849609375, 1.8768310546875, 1.98370361328125, 2.090576171875, 2.19744873046875, 2.3043212890625, 2.41119384765625, 2.51806640625, 2.62493896484375, 2.7318115234375, 2.83868408203125, 2.945556640625, 3.05242919921875, 3.1593017578125, 3.26617431640625, 3.373046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 6.0, 11.0, 12.0, 14.0, 10.0, 20.0, 18.0, 27.0, 25.0, 27.0, 41.0, 44.0, 44.0, 40.0, 49.0, 41.0, 48.0, 43.0, 53.0, 43.0, 46.0, 45.0, 41.0, 43.0, 29.0, 30.0, 22.0, 18.0, 16.0, 17.0, 14.0, 11.0, 13.0, 6.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.52734375, -2.4532470703125, -2.379150390625, -2.3050537109375, -2.23095703125, -2.1568603515625, -2.082763671875, -2.0086669921875, -1.9345703125, -1.8604736328125, -1.786376953125, -1.7122802734375, -1.63818359375, -1.5640869140625, -1.489990234375, -1.4158935546875, -1.341796875, -1.2677001953125, -1.193603515625, -1.1195068359375, -1.04541015625, -0.9713134765625, -0.897216796875, -0.8231201171875, -0.7490234375, -0.6749267578125, -0.600830078125, -0.5267333984375, -0.45263671875, -0.3785400390625, -0.304443359375, -0.2303466796875, -0.15625, -0.0821533203125, -0.008056640625, 0.0660400390625, 0.14013671875, 0.2142333984375, 0.288330078125, 0.3624267578125, 0.4365234375, 0.5106201171875, 0.584716796875, 0.6588134765625, 0.73291015625, 0.8070068359375, 0.881103515625, 0.9552001953125, 1.029296875, 1.1033935546875, 1.177490234375, 1.2515869140625, 1.32568359375, 1.3997802734375, 1.473876953125, 1.5479736328125, 1.6220703125, 1.6961669921875, 1.770263671875, 1.8443603515625, 1.91845703125, 1.9925537109375, 2.066650390625, 2.1407470703125, 2.21484375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 6.0, 8.0, 22.0, 22.0, 47.0, 57.0, 155.0, 318.0, 1006.0, 7563.0, 935788.0, 99452.0, 2998.0, 635.0, 205.0, 119.0, 55.0, 35.0, 20.0, 14.0, 9.0, 5.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.484375, -2.403717041015625, -2.32305908203125, -2.242401123046875, -2.1617431640625, -2.081085205078125, -2.00042724609375, -1.919769287109375, -1.839111328125, -1.758453369140625, -1.67779541015625, -1.597137451171875, -1.5164794921875, -1.435821533203125, -1.35516357421875, -1.274505615234375, -1.19384765625, -1.113189697265625, -1.03253173828125, -0.951873779296875, -0.8712158203125, -0.790557861328125, -0.70989990234375, -0.629241943359375, -0.548583984375, -0.467926025390625, -0.38726806640625, -0.306610107421875, -0.2259521484375, -0.145294189453125, -0.06463623046875, 0.016021728515625, 0.0966796875, 0.177337646484375, 0.25799560546875, 0.338653564453125, 0.4193115234375, 0.499969482421875, 0.58062744140625, 0.661285400390625, 0.741943359375, 0.822601318359375, 0.90325927734375, 0.983917236328125, 1.0645751953125, 1.145233154296875, 1.22589111328125, 1.306549072265625, 1.38720703125, 1.467864990234375, 1.54852294921875, 1.629180908203125, 1.7098388671875, 1.790496826171875, 1.87115478515625, 1.951812744140625, 2.032470703125, 2.113128662109375, 2.19378662109375, 2.274444580078125, 2.3551025390625, 2.435760498046875, 2.51641845703125, 2.597076416015625, 2.677734375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 10.0, 6.0, 13.0, 18.0, 21.0, 31.0, 44.0, 73.0, 121.0, 210.0, 183.0, 95.0, 54.0, 38.0, 23.0, 17.0, 12.0, 6.0, 11.0, 7.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.00028061866760253906, -0.00027340464293956757, -0.00026619061827659607, -0.00025897659361362457, -0.0002517625689506531, -0.0002445485442876816, -0.00023733451962471008, -0.00023012049496173859, -0.0002229064702987671, -0.0002156924456357956, -0.0002084784209728241, -0.0002012643963098526, -0.0001940503716468811, -0.0001868363469839096, -0.0001796223223209381, -0.00017240829765796661, -0.00016519427299499512, -0.00015798024833202362, -0.00015076622366905212, -0.00014355219900608063, -0.00013633817434310913, -0.00012912414968013763, -0.00012191012501716614, -0.00011469610035419464, -0.00010748207569122314, -0.00010026805102825165, -9.305402636528015e-05, -8.584000170230865e-05, -7.862597703933716e-05, -7.141195237636566e-05, -6.419792771339417e-05, -5.698390305042267e-05, -4.976987838745117e-05, -4.2555853724479675e-05, -3.534182906150818e-05, -2.8127804398536682e-05, -2.0913779735565186e-05, -1.3699755072593689e-05, -6.485730409622192e-06, 7.282942533493042e-07, 7.9423189163208e-06, 1.5156343579292297e-05, 2.2370368242263794e-05, 2.958439290523529e-05, 3.679841756820679e-05, 4.4012442231178284e-05, 5.122646689414978e-05, 5.844049155712128e-05, 6.565451622009277e-05, 7.286854088306427e-05, 8.008256554603577e-05, 8.729659020900726e-05, 9.451061487197876e-05, 0.00010172463953495026, 0.00010893866419792175, 0.00011615268886089325, 0.00012336671352386475, 0.00013058073818683624, 0.00013779476284980774, 0.00014500878751277924, 0.00015222281217575073, 0.00015943683683872223, 0.00016665086150169373, 0.00017386488616466522, 0.00018107891082763672]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 11.0, 11.0, 11.0, 19.0, 22.0, 44.0, 109.0, 223.0, 684.0, 2859.0, 24945.0, 861584.0, 148053.0, 7833.0, 1422.0, 410.0, 144.0, 71.0, 39.0, 18.0, 13.0, 14.0, 7.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.490234375, -1.4433135986328125, -1.396392822265625, -1.3494720458984375, -1.30255126953125, -1.2556304931640625, -1.208709716796875, -1.1617889404296875, -1.1148681640625, -1.0679473876953125, -1.021026611328125, -0.9741058349609375, -0.92718505859375, -0.8802642822265625, -0.833343505859375, -0.7864227294921875, -0.739501953125, -0.6925811767578125, -0.645660400390625, -0.5987396240234375, -0.55181884765625, -0.5048980712890625, -0.457977294921875, -0.4110565185546875, -0.3641357421875, -0.3172149658203125, -0.270294189453125, -0.2233734130859375, -0.17645263671875, -0.1295318603515625, -0.082611083984375, -0.0356903076171875, 0.01123046875, 0.0581512451171875, 0.105072021484375, 0.1519927978515625, 0.19891357421875, 0.2458343505859375, 0.292755126953125, 0.3396759033203125, 0.3865966796875, 0.4335174560546875, 0.480438232421875, 0.5273590087890625, 0.57427978515625, 0.6212005615234375, 0.668121337890625, 0.7150421142578125, 0.761962890625, 0.8088836669921875, 0.855804443359375, 0.9027252197265625, 0.94964599609375, 0.9965667724609375, 1.043487548828125, 1.0904083251953125, 1.1373291015625, 1.1842498779296875, 1.231170654296875, 1.2780914306640625, 1.32501220703125, 1.3719329833984375, 1.418853759765625, 1.4657745361328125, 1.5126953125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 1.0, 2.0, 12.0, 7.0, 12.0, 20.0, 33.0, 34.0, 55.0, 70.0, 87.0, 143.0, 115.0, 103.0, 89.0, 61.0, 46.0, 42.0, 14.0, 18.0, 3.0, 4.0, 10.0, 8.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62744140625, -0.6015548706054688, -0.5756683349609375, -0.5497817993164062, -0.523895263671875, -0.49800872802734375, -0.4721221923828125, -0.44623565673828125, -0.42034912109375, -0.39446258544921875, -0.3685760498046875, -0.34268951416015625, -0.316802978515625, -0.29091644287109375, -0.2650299072265625, -0.23914337158203125, -0.2132568359375, -0.18737030029296875, -0.1614837646484375, -0.13559722900390625, -0.109710693359375, -0.08382415771484375, -0.0579376220703125, -0.03205108642578125, -0.00616455078125, 0.01972198486328125, 0.0456085205078125, 0.07149505615234375, 0.097381591796875, 0.12326812744140625, 0.1491546630859375, 0.17504119873046875, 0.200927734375, 0.22681427001953125, 0.2527008056640625, 0.27858734130859375, 0.304473876953125, 0.33036041259765625, 0.3562469482421875, 0.38213348388671875, 0.40802001953125, 0.43390655517578125, 0.4597930908203125, 0.48567962646484375, 0.511566162109375, 0.5374526977539062, 0.5633392333984375, 0.5892257690429688, 0.6151123046875, 0.6409988403320312, 0.6668853759765625, 0.6927719116210938, 0.718658447265625, 0.7445449829101562, 0.7704315185546875, 0.7963180541992188, 0.82220458984375, 0.8480911254882812, 0.8739776611328125, 0.8998641967773438, 0.925750732421875, 0.9516372680664062, 0.9775238037109375, 1.0034103393554688, 1.029296875]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 10.0, 10.0, 41.0, 330.0, 535.0, 73.0, 9.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.299774169921875, -20.925472259521484, -19.55116844177246, -18.17686653137207, -16.802562713623047, -15.428260803222656, -14.053958892822266, -12.679656028747559, -11.305353164672852, -9.931050300598145, -8.556747436523438, -7.182445526123047, -5.80814266204834, -4.433839797973633, -3.059537887573242, -1.6852350234985352, -0.3109321594238281, 1.0633704662322998, 2.4376730918884277, 3.8119754791259766, 5.186278343200684, 6.560581207275391, 7.934883117675781, 9.309185981750488, 10.683488845825195, 12.057791709899902, 13.43209457397461, 14.806396484375, 16.18069839477539, 17.555002212524414, 18.929304122924805, 20.303607940673828, 21.67790985107422, 23.05221176147461, 24.426515579223633, 25.800817489624023, 27.175121307373047, 28.549423217773438, 29.923725128173828, 31.29802703857422, 32.672332763671875, 34.046634674072266, 35.420936584472656, 36.79524230957031, 38.1695442199707, 39.543846130371094, 40.918148040771484, 42.292449951171875, 43.666751861572266, 45.041053771972656, 46.41535568237305, 47.78965759277344, 49.163963317871094, 50.538265228271484, 51.912567138671875, 53.286869049072266, 54.661170959472656, 56.03547286987305, 57.40977478027344, 58.784080505371094, 60.158382415771484, 61.532684326171875, 62.906986236572266, 64.28128814697266, 65.65559387207031]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 2.0, 5.0, 2.0, 10.0, 7.0, 8.0, 9.0, 8.0, 13.0, 17.0, 17.0, 8.0, 19.0, 18.0, 16.0, 21.0, 19.0, 38.0, 26.0, 36.0, 36.0, 44.0, 41.0, 47.0, 56.0, 56.0, 46.0, 36.0, 45.0, 27.0, 24.0, 30.0, 25.0, 25.0, 22.0, 12.0, 17.0, 24.0, 14.0, 9.0, 9.0, 10.0, 14.0, 6.0, 6.0, 4.0, 3.0, 5.0, 7.0, 1.0, 0.0, 2.0, 2.0, 5.0], "bins": [-8.969715118408203, -8.70808219909668, -8.44644832611084, -8.184815406799316, -7.923182010650635, -7.661548614501953, -7.39991569519043, -7.138282299041748, -6.876648902893066, -6.615015506744385, -6.353382587432861, -6.09174919128418, -5.830115795135498, -5.568482398986816, -5.306849479675293, -5.045216083526611, -4.783583164215088, -4.521949768066406, -4.260316848754883, -3.998683452606201, -3.7370500564575195, -3.475416898727417, -3.2137837409973145, -2.952150344848633, -2.6905171871185303, -2.4288840293884277, -2.167250633239746, -1.9056174755096436, -1.6439841985702515, -1.3823509216308594, -1.1207177639007568, -0.8590844869613647, -0.5974512100219727, -0.33581796288490295, -0.07418471574783325, 0.18744850158691406, 0.44908177852630615, 0.7107150554656982, 0.9723482131958008, 1.2339814901351929, 1.495614767074585, 1.757248044013977, 2.018881320953369, 2.2805144786834717, 2.542147636413574, 2.803781032562256, 3.0654141902923584, 3.327047348022461, 3.5886807441711426, 3.850313901901245, 4.111947059631348, 4.373580455780029, 4.635213851928711, 4.896846771240234, 5.158480167388916, 5.420113563537598, 5.681746482849121, 5.943379878997803, 6.205012798309326, 6.466646194458008, 6.7282795906066895, 6.989912986755371, 7.2515459060668945, 7.513179302215576, 7.774812698364258]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 1.0, 4.0, 4.0, 6.0, 11.0, 11.0, 24.0, 31.0, 63.0, 98.0, 188.0, 365.0, 1023.0, 4124.0, 29034.0, 906618.0, 3149486.0, 92306.0, 7703.0, 1785.0, 631.0, 301.0, 157.0, 112.0, 68.0, 43.0, 32.0, 21.0, 12.0, 7.0, 7.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4140625, -1.3672637939453125, -1.320465087890625, -1.2736663818359375, -1.22686767578125, -1.1800689697265625, -1.133270263671875, -1.0864715576171875, -1.0396728515625, -0.9928741455078125, -0.946075439453125, -0.8992767333984375, -0.85247802734375, -0.8056793212890625, -0.758880615234375, -0.7120819091796875, -0.665283203125, -0.6184844970703125, -0.571685791015625, -0.5248870849609375, -0.47808837890625, -0.4312896728515625, -0.384490966796875, -0.3376922607421875, -0.2908935546875, -0.2440948486328125, -0.197296142578125, -0.1504974365234375, -0.10369873046875, -0.0569000244140625, -0.010101318359375, 0.0366973876953125, 0.08349609375, 0.1302947998046875, 0.177093505859375, 0.2238922119140625, 0.27069091796875, 0.3174896240234375, 0.364288330078125, 0.4110870361328125, 0.4578857421875, 0.5046844482421875, 0.551483154296875, 0.5982818603515625, 0.64508056640625, 0.6918792724609375, 0.738677978515625, 0.7854766845703125, 0.832275390625, 0.8790740966796875, 0.925872802734375, 0.9726715087890625, 1.01947021484375, 1.0662689208984375, 1.113067626953125, 1.1598663330078125, 1.2066650390625, 1.2534637451171875, 1.300262451171875, 1.3470611572265625, 1.39385986328125, 1.4406585693359375, 1.487457275390625, 1.5342559814453125, 1.5810546875]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 7.0, 9.0, 14.0, 17.0, 22.0, 42.0, 44.0, 51.0, 72.0, 73.0, 69.0, 79.0, 78.0, 84.0, 83.0, 56.0, 49.0, 38.0, 24.0, 24.0, 22.0, 20.0, 8.0, 6.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78857421875, -0.7558364868164062, -0.7230987548828125, -0.6903610229492188, -0.657623291015625, -0.6248855590820312, -0.5921478271484375, -0.5594100952148438, -0.52667236328125, -0.49393463134765625, -0.4611968994140625, -0.42845916748046875, -0.395721435546875, -0.36298370361328125, -0.3302459716796875, -0.29750823974609375, -0.2647705078125, -0.23203277587890625, -0.1992950439453125, -0.16655731201171875, -0.133819580078125, -0.10108184814453125, -0.0683441162109375, -0.03560638427734375, -0.00286865234375, 0.02986907958984375, 0.0626068115234375, 0.09534454345703125, 0.128082275390625, 0.16082000732421875, 0.1935577392578125, 0.22629547119140625, 0.259033203125, 0.29177093505859375, 0.3245086669921875, 0.35724639892578125, 0.389984130859375, 0.42272186279296875, 0.4554595947265625, 0.48819732666015625, 0.52093505859375, 0.5536727905273438, 0.5864105224609375, 0.6191482543945312, 0.651885986328125, 0.6846237182617188, 0.7173614501953125, 0.7500991821289062, 0.7828369140625, 0.8155746459960938, 0.8483123779296875, 0.8810501098632812, 0.913787841796875, 0.9465255737304688, 0.9792633056640625, 1.0120010375976562, 1.04473876953125, 1.0774765014648438, 1.1102142333984375, 1.1429519653320312, 1.175689697265625, 1.2084274291992188, 1.2411651611328125, 1.2739028930664062, 1.306640625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 8.0, 12.0, 10.0, 19.0, 44.0, 90.0, 159.0, 404.0, 1320.0, 5454.0, 43327.0, 1765612.0, 2313890.0, 55299.0, 6158.0, 1537.0, 493.0, 203.0, 97.0, 45.0, 33.0, 20.0, 17.0, 13.0, 12.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8623046875, -1.8106231689453125, -1.758941650390625, -1.7072601318359375, -1.65557861328125, -1.6038970947265625, -1.552215576171875, -1.5005340576171875, -1.4488525390625, -1.3971710205078125, -1.345489501953125, -1.2938079833984375, -1.24212646484375, -1.1904449462890625, -1.138763427734375, -1.0870819091796875, -1.035400390625, -0.9837188720703125, -0.932037353515625, -0.8803558349609375, -0.82867431640625, -0.7769927978515625, -0.725311279296875, -0.6736297607421875, -0.6219482421875, -0.5702667236328125, -0.518585205078125, -0.4669036865234375, -0.41522216796875, -0.3635406494140625, -0.311859130859375, -0.2601776123046875, -0.20849609375, -0.1568145751953125, -0.105133056640625, -0.0534515380859375, -0.00177001953125, 0.0499114990234375, 0.101593017578125, 0.1532745361328125, 0.2049560546875, 0.2566375732421875, 0.308319091796875, 0.3600006103515625, 0.41168212890625, 0.4633636474609375, 0.515045166015625, 0.5667266845703125, 0.618408203125, 0.6700897216796875, 0.721771240234375, 0.7734527587890625, 0.82513427734375, 0.8768157958984375, 0.928497314453125, 0.9801788330078125, 1.0318603515625, 1.0835418701171875, 1.135223388671875, 1.1869049072265625, 1.23858642578125, 1.2902679443359375, 1.341949462890625, 1.3936309814453125, 1.4453125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 5.0, 8.0, 11.0, 15.0, 19.0, 56.0, 59.0, 116.0, 181.0, 314.0, 515.0, 686.0, 738.0, 501.0, 331.0, 162.0, 125.0, 64.0, 46.0, 33.0, 15.0, 16.0, 14.0, 7.0, 11.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.33984375, -1.29791259765625, -1.2559814453125, -1.21405029296875, -1.172119140625, -1.13018798828125, -1.0882568359375, -1.04632568359375, -1.00439453125, -0.96246337890625, -0.9205322265625, -0.87860107421875, -0.836669921875, -0.79473876953125, -0.7528076171875, -0.71087646484375, -0.6689453125, -0.62701416015625, -0.5850830078125, -0.54315185546875, -0.501220703125, -0.45928955078125, -0.4173583984375, -0.37542724609375, -0.33349609375, -0.29156494140625, -0.2496337890625, -0.20770263671875, -0.165771484375, -0.12384033203125, -0.0819091796875, -0.03997802734375, 0.001953125, 0.04388427734375, 0.0858154296875, 0.12774658203125, 0.169677734375, 0.21160888671875, 0.2535400390625, 0.29547119140625, 0.33740234375, 0.37933349609375, 0.4212646484375, 0.46319580078125, 0.505126953125, 0.54705810546875, 0.5889892578125, 0.63092041015625, 0.6728515625, 0.71478271484375, 0.7567138671875, 0.79864501953125, 0.840576171875, 0.88250732421875, 0.9244384765625, 0.96636962890625, 1.00830078125, 1.05023193359375, 1.0921630859375, 1.13409423828125, 1.176025390625, 1.21795654296875, 1.2598876953125, 1.30181884765625, 1.34375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 11.0, 24.0, 50.0, 95.0, 142.0, 166.0, 176.0, 132.0, 65.0, 44.0, 28.0, 10.0, 10.0, 11.0, 3.0, 4.0, 3.0, 4.0, 3.0, 2.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.9011030197143555, -6.560537338256836, -6.219971656799316, -5.879405975341797, -5.538840293884277, -5.198274612426758, -4.857708930969238, -4.517143249511719, -4.176577568054199, -3.8360118865966797, -3.49544620513916, -3.1548805236816406, -2.814314842224121, -2.4737491607666016, -2.133183717727661, -1.7926180362701416, -1.4520525932312012, -1.1114869117736816, -0.7709212899208069, -0.43035566806793213, -0.0897899866104126, 0.25077569484710693, 0.5913412570953369, 0.9319069385528564, 1.272472620010376, 1.6130383014678955, 1.953603982925415, 2.2941694259643555, 2.634735107421875, 2.9753007888793945, 3.315866470336914, 3.6564321517944336, 3.996997833251953, 4.337563514709473, 4.678129196166992, 5.018694877624512, 5.359260559082031, 5.699826240539551, 6.04039192199707, 6.38095760345459, 6.721523284912109, 7.062088966369629, 7.402654647827148, 7.743220329284668, 8.083786010742188, 8.424351692199707, 8.764917373657227, 9.105483055114746, 9.446048736572266, 9.786614418029785, 10.127180099487305, 10.467745780944824, 10.808311462402344, 11.148877143859863, 11.489442825317383, 11.830008506774902, 12.170573234558105, 12.511138916015625, 12.851704597473145, 13.192270278930664, 13.532835960388184, 13.873401641845703, 14.213967323303223, 14.554533004760742, 14.895098686218262]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 8.0, 9.0, 6.0, 9.0, 10.0, 18.0, 8.0, 11.0, 20.0, 26.0, 25.0, 30.0, 31.0, 28.0, 38.0, 46.0, 47.0, 43.0, 40.0, 55.0, 43.0, 48.0, 44.0, 39.0, 45.0, 42.0, 35.0, 38.0, 29.0, 30.0, 18.0, 19.0, 12.0, 8.0, 8.0, 6.0, 10.0, 3.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.8602705001831055, -6.667733192443848, -6.47519588470459, -6.282658576965332, -6.090120792388916, -5.897583484649658, -5.7050461769104, -5.512508869171143, -5.319971561431885, -5.127434253692627, -4.934896945953369, -4.742359161376953, -4.549821853637695, -4.3572845458984375, -4.16474723815918, -3.972209930419922, -3.779672384262085, -3.587135076522827, -3.3945975303649902, -3.2020602226257324, -3.0095229148864746, -2.816985607147217, -2.62444806098938, -2.431910753250122, -2.239373207092285, -2.0468358993530273, -1.85429847240448, -1.6617610454559326, -1.4692237377166748, -1.2766863107681274, -1.08414888381958, -0.8916115760803223, -0.6990742683410645, -0.5065369009971619, -0.3139995038509369, -0.12146210670471191, 0.07107526063919067, 0.26361262798309326, 0.4561500549316406, 0.6486873626708984, 0.8412247896194458, 1.0337622165679932, 1.226299524307251, 1.4188369512557983, 1.6113743782043457, 1.8039116859436035, 1.9964491128921509, 2.188986301422119, 2.381523847579956, 2.574061155319214, 2.766598701477051, 2.9591360092163086, 3.1516733169555664, 3.344210624694824, 3.536748170852661, 3.729285478591919, 3.921823024749756, 4.114360332489014, 4.3068976402282715, 4.4994354248046875, 4.691972732543945, 4.884510040283203, 5.077047348022461, 5.269584655761719, 5.462121963500977]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 3.0, 9.0, 18.0, 30.0, 43.0, 58.0, 71.0, 118.0, 175.0, 253.0, 375.0, 612.0, 1181.0, 1931.0, 3795.0, 7262.0, 14744.0, 31656.0, 70601.0, 156511.0, 299573.0, 245758.0, 114971.0, 51717.0, 23478.0, 11277.0, 5522.0, 2857.0, 1530.0, 891.0, 522.0, 332.0, 216.0, 129.0, 103.0, 94.0, 34.0, 31.0, 26.0, 11.0, 8.0, 10.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.654296875, -0.633056640625, -0.61181640625, -0.590576171875, -0.5693359375, -0.548095703125, -0.52685546875, -0.505615234375, -0.484375, -0.463134765625, -0.44189453125, -0.420654296875, -0.3994140625, -0.378173828125, -0.35693359375, -0.335693359375, -0.314453125, -0.293212890625, -0.27197265625, -0.250732421875, -0.2294921875, -0.208251953125, -0.18701171875, -0.165771484375, -0.14453125, -0.123291015625, -0.10205078125, -0.080810546875, -0.0595703125, -0.038330078125, -0.01708984375, 0.004150390625, 0.025390625, 0.046630859375, 0.06787109375, 0.089111328125, 0.1103515625, 0.131591796875, 0.15283203125, 0.174072265625, 0.1953125, 0.216552734375, 0.23779296875, 0.259033203125, 0.2802734375, 0.301513671875, 0.32275390625, 0.343994140625, 0.365234375, 0.386474609375, 0.40771484375, 0.428955078125, 0.4501953125, 0.471435546875, 0.49267578125, 0.513916015625, 0.53515625, 0.556396484375, 0.57763671875, 0.598876953125, 0.6201171875, 0.641357421875, 0.66259765625, 0.683837890625, 0.705078125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 8.0, 11.0, 20.0, 21.0, 32.0, 47.0, 52.0, 71.0, 65.0, 77.0, 80.0, 87.0, 61.0, 70.0, 64.0, 60.0, 35.0, 40.0, 28.0, 16.0, 19.0, 13.0, 5.0, 8.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75927734375, -0.7268295288085938, -0.6943817138671875, -0.6619338989257812, -0.629486083984375, -0.5970382690429688, -0.5645904541015625, -0.5321426391601562, -0.49969482421875, -0.46724700927734375, -0.4347991943359375, -0.40235137939453125, -0.369903564453125, -0.33745574951171875, -0.3050079345703125, -0.27256011962890625, -0.2401123046875, -0.20766448974609375, -0.1752166748046875, -0.14276885986328125, -0.110321044921875, -0.07787322998046875, -0.0454254150390625, -0.01297760009765625, 0.01947021484375, 0.05191802978515625, 0.0843658447265625, 0.11681365966796875, 0.149261474609375, 0.18170928955078125, 0.2141571044921875, 0.24660491943359375, 0.279052734375, 0.31150054931640625, 0.3439483642578125, 0.37639617919921875, 0.408843994140625, 0.44129180908203125, 0.4737396240234375, 0.5061874389648438, 0.53863525390625, 0.5710830688476562, 0.6035308837890625, 0.6359786987304688, 0.668426513671875, 0.7008743286132812, 0.7333221435546875, 0.7657699584960938, 0.7982177734375, 0.8306655883789062, 0.8631134033203125, 0.8955612182617188, 0.928009033203125, 0.9604568481445312, 0.9929046630859375, 1.0253524780273438, 1.05780029296875, 1.0902481079101562, 1.1226959228515625, 1.1551437377929688, 1.187591552734375, 1.2200393676757812, 1.2524871826171875, 1.2849349975585938, 1.3173828125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 3.0, 3.0, 2.0, 4.0, 6.0, 7.0, 6.0, 13.0, 11.0, 19.0, 21.0, 42.0, 30.0, 61.0, 76.0, 102.0, 161.0, 177.0, 229.0, 327.0, 508.0, 737.0, 1232.0, 2058.0, 4297.0, 12546.0, 53901.0, 338211.0, 538687.0, 68471.0, 15347.0, 5055.0, 2295.0, 1244.0, 815.0, 548.0, 355.0, 258.0, 188.0, 130.0, 96.0, 74.0, 58.0, 39.0, 29.0, 25.0, 14.0, 18.0, 13.0, 1.0, 7.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3876953125, -1.3430328369140625, -1.298370361328125, -1.2537078857421875, -1.20904541015625, -1.1643829345703125, -1.119720458984375, -1.0750579833984375, -1.0303955078125, -0.9857330322265625, -0.941070556640625, -0.8964080810546875, -0.85174560546875, -0.8070831298828125, -0.762420654296875, -0.7177581787109375, -0.673095703125, -0.6284332275390625, -0.583770751953125, -0.5391082763671875, -0.49444580078125, -0.4497833251953125, -0.405120849609375, -0.3604583740234375, -0.3157958984375, -0.2711334228515625, -0.226470947265625, -0.1818084716796875, -0.13714599609375, -0.0924835205078125, -0.047821044921875, -0.0031585693359375, 0.04150390625, 0.0861663818359375, 0.130828857421875, 0.1754913330078125, 0.22015380859375, 0.2648162841796875, 0.309478759765625, 0.3541412353515625, 0.3988037109375, 0.4434661865234375, 0.488128662109375, 0.5327911376953125, 0.57745361328125, 0.6221160888671875, 0.666778564453125, 0.7114410400390625, 0.756103515625, 0.8007659912109375, 0.845428466796875, 0.8900909423828125, 0.93475341796875, 0.9794158935546875, 1.024078369140625, 1.0687408447265625, 1.1134033203125, 1.1580657958984375, 1.202728271484375, 1.2473907470703125, 1.29205322265625, 1.3367156982421875, 1.381378173828125, 1.4260406494140625, 1.470703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 1.0, 7.0, 5.0, 8.0, 10.0, 9.0, 14.0, 16.0, 14.0, 20.0, 21.0, 29.0, 23.0, 34.0, 31.0, 39.0, 50.0, 51.0, 56.0, 51.0, 50.0, 51.0, 45.0, 53.0, 42.0, 43.0, 34.0, 36.0, 29.0, 25.0, 24.0, 16.0, 11.0, 8.0, 8.0, 10.0, 6.0, 9.0, 3.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.228515625, -3.13232421875, -3.0361328125, -2.93994140625, -2.84375, -2.74755859375, -2.6513671875, -2.55517578125, -2.458984375, -2.36279296875, -2.2666015625, -2.17041015625, -2.07421875, -1.97802734375, -1.8818359375, -1.78564453125, -1.689453125, -1.59326171875, -1.4970703125, -1.40087890625, -1.3046875, -1.20849609375, -1.1123046875, -1.01611328125, -0.919921875, -0.82373046875, -0.7275390625, -0.63134765625, -0.53515625, -0.43896484375, -0.3427734375, -0.24658203125, -0.150390625, -0.05419921875, 0.0419921875, 0.13818359375, 0.234375, 0.33056640625, 0.4267578125, 0.52294921875, 0.619140625, 0.71533203125, 0.8115234375, 0.90771484375, 1.00390625, 1.10009765625, 1.1962890625, 1.29248046875, 1.388671875, 1.48486328125, 1.5810546875, 1.67724609375, 1.7734375, 1.86962890625, 1.9658203125, 2.06201171875, 2.158203125, 2.25439453125, 2.3505859375, 2.44677734375, 2.54296875, 2.63916015625, 2.7353515625, 2.83154296875, 2.927734375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 7.0, 12.0, 22.0, 31.0, 35.0, 38.0, 60.0, 85.0, 144.0, 251.0, 395.0, 658.0, 1284.0, 2321.0, 5243.0, 13971.0, 47199.0, 208143.0, 630107.0, 97120.0, 25403.0, 8370.0, 3524.0, 1710.0, 963.0, 511.0, 316.0, 205.0, 126.0, 81.0, 67.0, 52.0, 26.0, 23.0, 6.0, 9.0, 11.0, 6.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0], "bins": [-0.73046875, -0.7113761901855469, -0.6922836303710938, -0.6731910705566406, -0.6540985107421875, -0.6350059509277344, -0.6159133911132812, -0.5968208312988281, -0.577728271484375, -0.5586357116699219, -0.5395431518554688, -0.5204505920410156, -0.5013580322265625, -0.4822654724121094, -0.46317291259765625, -0.4440803527832031, -0.42498779296875, -0.4058952331542969, -0.38680267333984375, -0.3677101135253906, -0.3486175537109375, -0.3295249938964844, -0.31043243408203125, -0.2913398742675781, -0.272247314453125, -0.2531547546386719, -0.23406219482421875, -0.21496963500976562, -0.1958770751953125, -0.17678451538085938, -0.15769195556640625, -0.13859939575195312, -0.1195068359375, -0.10041427612304688, -0.08132171630859375, -0.062229156494140625, -0.0431365966796875, -0.024044036865234375, -0.00495147705078125, 0.014141082763671875, 0.033233642578125, 0.052326202392578125, 0.07141876220703125, 0.09051132202148438, 0.1096038818359375, 0.12869644165039062, 0.14778900146484375, 0.16688156127929688, 0.18597412109375, 0.20506668090820312, 0.22415924072265625, 0.24325180053710938, 0.2623443603515625, 0.2814369201660156, 0.30052947998046875, 0.3196220397949219, 0.338714599609375, 0.3578071594238281, 0.37689971923828125, 0.3959922790527344, 0.4150848388671875, 0.4341773986816406, 0.45326995849609375, 0.4723625183105469, 0.491455078125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 1.0, 6.0, 3.0, 7.0, 8.0, 5.0, 14.0, 10.0, 12.0, 17.0, 25.0, 31.0, 32.0, 41.0, 33.0, 67.0, 94.0, 156.0, 105.0, 65.0, 55.0, 35.0, 25.0, 32.0, 23.0, 14.0, 14.0, 11.0, 20.0, 2.0, 15.0, 6.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0001819133758544922, -0.00017593801021575928, -0.00016996264457702637, -0.00016398727893829346, -0.00015801191329956055, -0.00015203654766082764, -0.00014606118202209473, -0.00014008581638336182, -0.0001341104507446289, -0.000128135085105896, -0.00012215971946716309, -0.00011618435382843018, -0.00011020898818969727, -0.00010423362255096436, -9.825825691223145e-05, -9.228289127349854e-05, -8.630752563476562e-05, -8.033215999603271e-05, -7.43567943572998e-05, -6.83814287185669e-05, -6.240606307983398e-05, -5.6430697441101074e-05, -5.0455331802368164e-05, -4.4479966163635254e-05, -3.8504600524902344e-05, -3.2529234886169434e-05, -2.6553869247436523e-05, -2.0578503608703613e-05, -1.4603137969970703e-05, -8.627772331237793e-06, -2.652406692504883e-06, 3.3229589462280273e-06, 9.298324584960938e-06, 1.5273690223693848e-05, 2.1249055862426758e-05, 2.7224421501159668e-05, 3.319978713989258e-05, 3.917515277862549e-05, 4.51505184173584e-05, 5.112588405609131e-05, 5.710124969482422e-05, 6.307661533355713e-05, 6.905198097229004e-05, 7.502734661102295e-05, 8.100271224975586e-05, 8.697807788848877e-05, 9.295344352722168e-05, 9.892880916595459e-05, 0.0001049041748046875, 0.00011087954044342041, 0.00011685490608215332, 0.00012283027172088623, 0.00012880563735961914, 0.00013478100299835205, 0.00014075636863708496, 0.00014673173427581787, 0.00015270709991455078, 0.0001586824655532837, 0.0001646578311920166, 0.0001706331968307495, 0.00017660856246948242, 0.00018258392810821533, 0.00018855929374694824, 0.00019453465938568115, 0.00020051002502441406]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 7.0, 10.0, 13.0, 20.0, 22.0, 51.0, 74.0, 106.0, 177.0, 352.0, 560.0, 1134.0, 2542.0, 7164.0, 29033.0, 207226.0, 710494.0, 68712.0, 13273.0, 4045.0, 1630.0, 816.0, 435.0, 236.0, 139.0, 86.0, 52.0, 42.0, 21.0, 24.0, 12.0, 7.0, 11.0, 6.0, 3.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9765625, -0.9488525390625, -0.921142578125, -0.8934326171875, -0.86572265625, -0.8380126953125, -0.810302734375, -0.7825927734375, -0.7548828125, -0.7271728515625, -0.699462890625, -0.6717529296875, -0.64404296875, -0.6163330078125, -0.588623046875, -0.5609130859375, -0.533203125, -0.5054931640625, -0.477783203125, -0.4500732421875, -0.42236328125, -0.3946533203125, -0.366943359375, -0.3392333984375, -0.3115234375, -0.2838134765625, -0.256103515625, -0.2283935546875, -0.20068359375, -0.1729736328125, -0.145263671875, -0.1175537109375, -0.08984375, -0.0621337890625, -0.034423828125, -0.0067138671875, 0.02099609375, 0.0487060546875, 0.076416015625, 0.1041259765625, 0.1318359375, 0.1595458984375, 0.187255859375, 0.2149658203125, 0.24267578125, 0.2703857421875, 0.298095703125, 0.3258056640625, 0.353515625, 0.3812255859375, 0.408935546875, 0.4366455078125, 0.46435546875, 0.4920654296875, 0.519775390625, 0.5474853515625, 0.5751953125, 0.6029052734375, 0.630615234375, 0.6583251953125, 0.68603515625, 0.7137451171875, 0.741455078125, 0.7691650390625, 0.796875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 10.0, 6.0, 8.0, 20.0, 19.0, 38.0, 46.0, 48.0, 89.0, 98.0, 131.0, 116.0, 103.0, 82.0, 42.0, 33.0, 34.0, 18.0, 7.0, 8.0, 12.0, 9.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.96435546875, -0.9340133666992188, -0.9036712646484375, -0.8733291625976562, -0.842987060546875, -0.8126449584960938, -0.7823028564453125, -0.7519607543945312, -0.72161865234375, -0.6912765502929688, -0.6609344482421875, -0.6305923461914062, -0.600250244140625, -0.5699081420898438, -0.5395660400390625, -0.5092239379882812, -0.4788818359375, -0.44853973388671875, -0.4181976318359375, -0.38785552978515625, -0.357513427734375, -0.32717132568359375, -0.2968292236328125, -0.26648712158203125, -0.23614501953125, -0.20580291748046875, -0.1754608154296875, -0.14511871337890625, -0.114776611328125, -0.08443450927734375, -0.0540924072265625, -0.02375030517578125, 0.006591796875, 0.03693389892578125, 0.0672760009765625, 0.09761810302734375, 0.127960205078125, 0.15830230712890625, 0.1886444091796875, 0.21898651123046875, 0.24932861328125, 0.27967071533203125, 0.3100128173828125, 0.34035491943359375, 0.370697021484375, 0.40103912353515625, 0.4313812255859375, 0.46172332763671875, 0.4920654296875, 0.5224075317382812, 0.5527496337890625, 0.5830917358398438, 0.613433837890625, 0.6437759399414062, 0.6741180419921875, 0.7044601440429688, 0.73480224609375, 0.7651443481445312, 0.7954864501953125, 0.8258285522460938, 0.856170654296875, 0.8865127563476562, 0.9168548583984375, 0.9471969604492188, 0.9775390625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 8.0, 12.0, 28.0, 69.0, 137.0, 274.0, 253.0, 115.0, 40.0, 26.0, 8.0, 7.0, 2.0, 5.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.469467163085938, -20.856014251708984, -20.242563247680664, -19.62911033630371, -19.015657424926758, -18.402206420898438, -17.788753509521484, -17.17530059814453, -16.56184959411621, -15.948397636413574, -15.334944725036621, -14.721492767333984, -14.108040809631348, -13.494588851928711, -12.881135940551758, -12.267683982849121, -11.654231071472168, -11.040779113769531, -10.427326202392578, -9.813874244689941, -9.200422286987305, -8.586969375610352, -7.973517417907715, -7.360065460205078, -6.746613025665283, -6.133160591125488, -5.519708633422852, -4.906256198883057, -4.292803764343262, -3.679351806640625, -3.06589937210083, -2.4524474143981934, -1.8389949798583984, -1.2255427837371826, -0.6120904684066772, 0.001361846923828125, 0.614814043045044, 1.2282662391662598, 1.8417186737060547, 2.4551706314086914, 3.0686230659484863, 3.682075262069702, 4.295527458190918, 4.908979892730713, 5.522432327270508, 6.1358842849731445, 6.7493367195129395, 7.362788677215576, 7.976241111755371, 8.589693069458008, 9.203145980834961, 9.816597938537598, 10.430049896240234, 11.043502807617188, 11.656954765319824, 12.270406723022461, 12.883859634399414, 13.49731159210205, 14.110764503479004, 14.72421646118164, 15.337668418884277, 15.951120376586914, 16.564573287963867, 17.178024291992188, 17.79147720336914]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 8.0, 5.0, 4.0, 15.0, 15.0, 18.0, 17.0, 24.0, 30.0, 25.0, 25.0, 27.0, 21.0, 29.0, 37.0, 39.0, 43.0, 73.0, 55.0, 58.0, 66.0, 36.0, 37.0, 28.0, 33.0, 21.0, 27.0, 25.0, 22.0, 19.0, 18.0, 18.0, 6.0, 27.0, 8.0, 6.0, 13.0, 3.0, 2.0, 1.0, 3.0, 6.0, 4.0, 1.0, 1.0, 0.0, 4.0], "bins": [-11.630964279174805, -11.303140640258789, -10.975316047668457, -10.647492408752441, -10.31966781616211, -9.991844177246094, -9.664020538330078, -9.336196899414062, -9.00837230682373, -8.680548667907715, -8.352724075317383, -8.024900436401367, -7.697076320648193, -7.3692522048950195, -7.041428565979004, -6.71360445022583, -6.385780334472656, -6.057956218719482, -5.730132102966309, -5.402308464050293, -5.074484348297119, -4.746660232543945, -4.41883659362793, -4.091012477874756, -3.763188362121582, -3.435364246368408, -3.1075403690338135, -2.7797164916992188, -2.451892375946045, -2.124068260192871, -1.7962443828582764, -1.4684205055236816, -1.1405963897705078, -0.8127723932266235, -0.48494839668273926, -0.15712440013885498, 0.1706995964050293, 0.4985235929489136, 0.8263475894927979, 1.1541714668273926, 1.4819955825805664, 1.8098195791244507, 2.137643575668335, 2.4654674530029297, 2.7932915687561035, 3.1211156845092773, 3.448939561843872, 3.776763439178467, 4.104587554931641, 4.4324116706848145, 4.760235786437988, 5.088059425354004, 5.415883541107178, 5.743707656860352, 6.071531295776367, 6.399355411529541, 6.727179527282715, 7.055003643035889, 7.3828277587890625, 7.710651397705078, 8.038475036621094, 8.366299629211426, 8.694123268127441, 9.021947860717773, 9.349771499633789]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 6.0, 6.0, 15.0, 18.0, 31.0, 58.0, 114.0, 167.0, 343.0, 644.0, 1432.0, 4459.0, 17504.0, 111631.0, 1437781.0, 2371142.0, 214989.0, 24387.0, 5664.0, 2052.0, 843.0, 410.0, 207.0, 132.0, 88.0, 48.0, 31.0, 27.0, 13.0, 7.0, 9.0, 8.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8349609375, -0.806304931640625, -0.77764892578125, -0.748992919921875, -0.7203369140625, -0.691680908203125, -0.66302490234375, -0.634368896484375, -0.605712890625, -0.577056884765625, -0.54840087890625, -0.519744873046875, -0.4910888671875, -0.462432861328125, -0.43377685546875, -0.405120849609375, -0.37646484375, -0.347808837890625, -0.31915283203125, -0.290496826171875, -0.2618408203125, -0.233184814453125, -0.20452880859375, -0.175872802734375, -0.147216796875, -0.118560791015625, -0.08990478515625, -0.061248779296875, -0.0325927734375, -0.003936767578125, 0.02471923828125, 0.053375244140625, 0.08203125, 0.110687255859375, 0.13934326171875, 0.167999267578125, 0.1966552734375, 0.225311279296875, 0.25396728515625, 0.282623291015625, 0.311279296875, 0.339935302734375, 0.36859130859375, 0.397247314453125, 0.4259033203125, 0.454559326171875, 0.48321533203125, 0.511871337890625, 0.54052734375, 0.569183349609375, 0.59783935546875, 0.626495361328125, 0.6551513671875, 0.683807373046875, 0.71246337890625, 0.741119384765625, 0.769775390625, 0.798431396484375, 0.82708740234375, 0.855743408203125, 0.8843994140625, 0.913055419921875, 0.94171142578125, 0.970367431640625, 0.9990234375]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 3.0, 7.0, 12.0, 16.0, 19.0, 35.0, 29.0, 39.0, 48.0, 67.0, 69.0, 64.0, 71.0, 79.0, 79.0, 76.0, 58.0, 65.0, 30.0, 34.0, 26.0, 25.0, 18.0, 10.0, 7.0, 2.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7998046875, -0.76922607421875, -0.7386474609375, -0.70806884765625, -0.677490234375, -0.64691162109375, -0.6163330078125, -0.58575439453125, -0.55517578125, -0.52459716796875, -0.4940185546875, -0.46343994140625, -0.432861328125, -0.40228271484375, -0.3717041015625, -0.34112548828125, -0.310546875, -0.27996826171875, -0.2493896484375, -0.21881103515625, -0.188232421875, -0.15765380859375, -0.1270751953125, -0.09649658203125, -0.06591796875, -0.03533935546875, -0.0047607421875, 0.02581787109375, 0.056396484375, 0.08697509765625, 0.1175537109375, 0.14813232421875, 0.1787109375, 0.20928955078125, 0.2398681640625, 0.27044677734375, 0.301025390625, 0.33160400390625, 0.3621826171875, 0.39276123046875, 0.42333984375, 0.45391845703125, 0.4844970703125, 0.51507568359375, 0.545654296875, 0.57623291015625, 0.6068115234375, 0.63739013671875, 0.66796875, 0.69854736328125, 0.7291259765625, 0.75970458984375, 0.790283203125, 0.82086181640625, 0.8514404296875, 0.88201904296875, 0.91259765625, 0.94317626953125, 0.9737548828125, 1.00433349609375, 1.034912109375, 1.06549072265625, 1.0960693359375, 1.12664794921875, 1.1572265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 3.0, 10.0, 19.0, 34.0, 53.0, 106.0, 188.0, 315.0, 829.0, 3334.0, 26288.0, 1151867.0, 2948753.0, 54294.0, 5791.0, 1290.0, 466.0, 247.0, 153.0, 84.0, 55.0, 36.0, 20.0, 15.0, 7.0, 10.0, 8.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.431640625, -1.3768310546875, -1.322021484375, -1.2672119140625, -1.21240234375, -1.1575927734375, -1.102783203125, -1.0479736328125, -0.9931640625, -0.9383544921875, -0.883544921875, -0.8287353515625, -0.77392578125, -0.7191162109375, -0.664306640625, -0.6094970703125, -0.5546875, -0.4998779296875, -0.445068359375, -0.3902587890625, -0.33544921875, -0.2806396484375, -0.225830078125, -0.1710205078125, -0.1162109375, -0.0614013671875, -0.006591796875, 0.0482177734375, 0.10302734375, 0.1578369140625, 0.212646484375, 0.2674560546875, 0.322265625, 0.3770751953125, 0.431884765625, 0.4866943359375, 0.54150390625, 0.5963134765625, 0.651123046875, 0.7059326171875, 0.7607421875, 0.8155517578125, 0.870361328125, 0.9251708984375, 0.97998046875, 1.0347900390625, 1.089599609375, 1.1444091796875, 1.19921875, 1.2540283203125, 1.308837890625, 1.3636474609375, 1.41845703125, 1.4732666015625, 1.528076171875, 1.5828857421875, 1.6376953125, 1.6925048828125, 1.747314453125, 1.8021240234375, 1.85693359375, 1.9117431640625, 1.966552734375, 2.0213623046875, 2.076171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 2.0, 7.0, 10.0, 15.0, 40.0, 57.0, 90.0, 217.0, 406.0, 700.0, 939.0, 697.0, 413.0, 207.0, 107.0, 54.0, 36.0, 22.0, 20.0, 10.0, 10.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.86328125, -1.8136138916015625, -1.763946533203125, -1.7142791748046875, -1.66461181640625, -1.6149444580078125, -1.565277099609375, -1.5156097412109375, -1.4659423828125, -1.4162750244140625, -1.366607666015625, -1.3169403076171875, -1.26727294921875, -1.2176055908203125, -1.167938232421875, -1.1182708740234375, -1.068603515625, -1.0189361572265625, -0.969268798828125, -0.9196014404296875, -0.86993408203125, -0.8202667236328125, -0.770599365234375, -0.7209320068359375, -0.6712646484375, -0.6215972900390625, -0.571929931640625, -0.5222625732421875, -0.47259521484375, -0.4229278564453125, -0.373260498046875, -0.3235931396484375, -0.27392578125, -0.2242584228515625, -0.174591064453125, -0.1249237060546875, -0.07525634765625, -0.0255889892578125, 0.024078369140625, 0.0737457275390625, 0.1234130859375, 0.1730804443359375, 0.222747802734375, 0.2724151611328125, 0.32208251953125, 0.3717498779296875, 0.421417236328125, 0.4710845947265625, 0.520751953125, 0.5704193115234375, 0.620086669921875, 0.6697540283203125, 0.71942138671875, 0.7690887451171875, 0.818756103515625, 0.8684234619140625, 0.9180908203125, 0.9677581787109375, 1.017425537109375, 1.0670928955078125, 1.11676025390625, 1.1664276123046875, 1.216094970703125, 1.2657623291015625, 1.3154296875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 8.0, 7.0, 27.0, 31.0, 90.0, 151.0, 197.0, 197.0, 119.0, 81.0, 32.0, 25.0, 10.0, 6.0, 5.0, 3.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.263429641723633, -10.882589340209961, -10.501748085021973, -10.1209077835083, -9.740067481994629, -9.35922622680664, -8.978385925292969, -8.597545623779297, -8.216704368591309, -7.8358635902404785, -7.455023288726807, -7.074182510375977, -6.6933417320251465, -6.312500953674316, -5.9316606521606445, -5.5508198738098145, -5.169979572296143, -4.7891387939453125, -4.408298492431641, -4.0274577140808105, -3.6466169357299805, -3.2657763957977295, -2.8849358558654785, -2.5040950775146484, -2.1232545375823975, -1.742413878440857, -1.3615732192993164, -0.9807326793670654, -0.5998920202255249, -0.21905136108398438, 0.1617891788482666, 0.5426299571990967, 0.9234704971313477, 1.3043111562728882, 1.6851518154144287, 2.0659923553466797, 2.4468331336975098, 2.8276736736297607, 3.2085142135620117, 3.589354991912842, 3.9701955318450928, 4.351036071777344, 4.731876850128174, 5.112717628479004, 5.493557929992676, 5.874398708343506, 6.255239486694336, 6.636079788208008, 7.016920566558838, 7.397761344909668, 7.77860164642334, 8.159442901611328, 8.540283203125, 8.921123504638672, 9.301963806152344, 9.682805061340332, 10.063645362854004, 10.444485664367676, 10.825326919555664, 11.206167221069336, 11.587007522583008, 11.967848777770996, 12.348689079284668, 12.729530334472656, 13.110370635986328]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 8.0, 15.0, 10.0, 14.0, 20.0, 28.0, 42.0, 32.0, 21.0, 48.0, 53.0, 49.0, 61.0, 70.0, 70.0, 46.0, 73.0, 60.0, 55.0, 40.0, 36.0, 39.0, 25.0, 18.0, 17.0, 9.0, 10.0, 2.0, 8.0, 6.0, 4.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.208133220672607, -5.00026273727417, -4.792392730712891, -4.584522247314453, -4.376651763916016, -4.168781757354736, -3.960911273956299, -3.7530410289764404, -3.545170783996582, -3.3373005390167236, -3.1294302940368652, -2.9215598106384277, -2.7136895656585693, -2.505819320678711, -2.2979488372802734, -2.090078592300415, -1.8822083473205566, -1.6743381023406982, -1.4664677381515503, -1.2585973739624023, -1.050727128982544, -0.8428568840026855, -0.6349865198135376, -0.42711615562438965, -0.21924591064453125, -0.011375606060028076, 0.1964946985244751, 0.40436500310897827, 0.6122353076934814, 0.8201055526733398, 1.0279759168624878, 1.2358462810516357, 1.443716049194336, 1.6515862941741943, 1.8594566583633423, 2.0673270225524902, 2.2751972675323486, 2.483067512512207, 2.6909379959106445, 2.898808240890503, 3.1066784858703613, 3.3145487308502197, 3.522418975830078, 3.7302894592285156, 3.938159704208374, 4.146029949188232, 4.35390043258667, 4.561770439147949, 4.769640922546387, 4.977511405944824, 5.1853814125061035, 5.393251895904541, 5.60112190246582, 5.808992385864258, 6.016862869262695, 6.224733352661133, 6.432603359222412, 6.64047384262085, 6.848343849182129, 7.056214332580566, 7.264084815979004, 7.471954822540283, 7.679825305938721, 7.8876953125, 8.095565795898438]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 9.0, 6.0, 12.0, 9.0, 16.0, 28.0, 35.0, 50.0, 102.0, 214.0, 375.0, 651.0, 1191.0, 2428.0, 5190.0, 13292.0, 37290.0, 119430.0, 390531.0, 330708.0, 95927.0, 30840.0, 11100.0, 4555.0, 2157.0, 1082.0, 535.0, 311.0, 189.0, 105.0, 75.0, 40.0, 29.0, 10.0, 11.0, 3.0, 8.0, 6.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.962890625, -0.9327163696289062, -0.9025421142578125, -0.8723678588867188, -0.842193603515625, -0.8120193481445312, -0.7818450927734375, -0.7516708374023438, -0.72149658203125, -0.6913223266601562, -0.6611480712890625, -0.6309738159179688, -0.600799560546875, -0.5706253051757812, -0.5404510498046875, -0.5102767944335938, -0.4801025390625, -0.44992828369140625, -0.4197540283203125, -0.38957977294921875, -0.359405517578125, -0.32923126220703125, -0.2990570068359375, -0.26888275146484375, -0.23870849609375, -0.20853424072265625, -0.1783599853515625, -0.14818572998046875, -0.118011474609375, -0.08783721923828125, -0.0576629638671875, -0.02748870849609375, 0.002685546875, 0.03285980224609375, 0.0630340576171875, 0.09320831298828125, 0.123382568359375, 0.15355682373046875, 0.1837310791015625, 0.21390533447265625, 0.24407958984375, 0.27425384521484375, 0.3044281005859375, 0.33460235595703125, 0.364776611328125, 0.39495086669921875, 0.4251251220703125, 0.45529937744140625, 0.4854736328125, 0.5156478881835938, 0.5458221435546875, 0.5759963989257812, 0.606170654296875, 0.6363449096679688, 0.6665191650390625, 0.6966934204101562, 0.72686767578125, 0.7570419311523438, 0.7872161865234375, 0.8173904418945312, 0.847564697265625, 0.8777389526367188, 0.9079132080078125, 0.9380874633789062, 0.96826171875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 6.0, 7.0, 12.0, 13.0, 25.0, 24.0, 33.0, 52.0, 47.0, 44.0, 66.0, 67.0, 79.0, 77.0, 71.0, 82.0, 62.0, 64.0, 30.0, 36.0, 25.0, 23.0, 17.0, 11.0, 7.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7529296875, -0.7230072021484375, -0.693084716796875, -0.6631622314453125, -0.63323974609375, -0.6033172607421875, -0.573394775390625, -0.5434722900390625, -0.5135498046875, -0.4836273193359375, -0.453704833984375, -0.4237823486328125, -0.39385986328125, -0.3639373779296875, -0.334014892578125, -0.3040924072265625, -0.274169921875, -0.2442474365234375, -0.214324951171875, -0.1844024658203125, -0.15447998046875, -0.1245574951171875, -0.094635009765625, -0.0647125244140625, -0.0347900390625, -0.0048675537109375, 0.025054931640625, 0.0549774169921875, 0.08489990234375, 0.1148223876953125, 0.144744873046875, 0.1746673583984375, 0.20458984375, 0.2345123291015625, 0.264434814453125, 0.2943572998046875, 0.32427978515625, 0.3542022705078125, 0.384124755859375, 0.4140472412109375, 0.4439697265625, 0.4738922119140625, 0.503814697265625, 0.5337371826171875, 0.56365966796875, 0.5935821533203125, 0.623504638671875, 0.6534271240234375, 0.683349609375, 0.7132720947265625, 0.743194580078125, 0.7731170654296875, 0.80303955078125, 0.8329620361328125, 0.862884521484375, 0.8928070068359375, 0.9227294921875, 0.9526519775390625, 0.982574462890625, 1.0124969482421875, 1.04241943359375, 1.0723419189453125, 1.102264404296875, 1.1321868896484375, 1.162109375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 8.0, 13.0, 9.0, 18.0, 36.0, 26.0, 81.0, 119.0, 244.0, 403.0, 770.0, 1733.0, 5437.0, 34689.0, 709738.0, 269732.0, 19025.0, 3699.0, 1313.0, 661.0, 322.0, 202.0, 118.0, 66.0, 38.0, 24.0, 19.0, 10.0, 7.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6640625, -2.58538818359375, -2.5067138671875, -2.42803955078125, -2.349365234375, -2.27069091796875, -2.1920166015625, -2.11334228515625, -2.03466796875, -1.95599365234375, -1.8773193359375, -1.79864501953125, -1.719970703125, -1.64129638671875, -1.5626220703125, -1.48394775390625, -1.4052734375, -1.32659912109375, -1.2479248046875, -1.16925048828125, -1.090576171875, -1.01190185546875, -0.9332275390625, -0.85455322265625, -0.77587890625, -0.69720458984375, -0.6185302734375, -0.53985595703125, -0.461181640625, -0.38250732421875, -0.3038330078125, -0.22515869140625, -0.146484375, -0.06781005859375, 0.0108642578125, 0.08953857421875, 0.168212890625, 0.24688720703125, 0.3255615234375, 0.40423583984375, 0.48291015625, 0.56158447265625, 0.6402587890625, 0.71893310546875, 0.797607421875, 0.87628173828125, 0.9549560546875, 1.03363037109375, 1.1123046875, 1.19097900390625, 1.2696533203125, 1.34832763671875, 1.427001953125, 1.50567626953125, 1.5843505859375, 1.66302490234375, 1.74169921875, 1.82037353515625, 1.8990478515625, 1.97772216796875, 2.056396484375, 2.13507080078125, 2.2137451171875, 2.29241943359375, 2.37109375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 5.0, 6.0, 9.0, 3.0, 7.0, 9.0, 10.0, 8.0, 13.0, 12.0, 22.0, 24.0, 26.0, 22.0, 41.0, 45.0, 54.0, 55.0, 50.0, 40.0, 39.0, 60.0, 46.0, 46.0, 47.0, 50.0, 34.0, 28.0, 28.0, 30.0, 30.0, 27.0, 17.0, 19.0, 10.0, 5.0, 6.0, 5.0, 6.0, 2.0, 1.0, 1.0, 6.0, 4.0], "bins": [-3.458984375, -3.3751373291015625, -3.291290283203125, -3.2074432373046875, -3.12359619140625, -3.0397491455078125, -2.955902099609375, -2.8720550537109375, -2.7882080078125, -2.7043609619140625, -2.620513916015625, -2.5366668701171875, -2.45281982421875, -2.3689727783203125, -2.285125732421875, -2.2012786865234375, -2.117431640625, -2.0335845947265625, -1.949737548828125, -1.8658905029296875, -1.78204345703125, -1.6981964111328125, -1.614349365234375, -1.5305023193359375, -1.4466552734375, -1.3628082275390625, -1.278961181640625, -1.1951141357421875, -1.11126708984375, -1.0274200439453125, -0.943572998046875, -0.8597259521484375, -0.77587890625, -0.6920318603515625, -0.608184814453125, -0.5243377685546875, -0.44049072265625, -0.3566436767578125, -0.272796630859375, -0.1889495849609375, -0.1051025390625, -0.0212554931640625, 0.062591552734375, 0.1464385986328125, 0.23028564453125, 0.3141326904296875, 0.397979736328125, 0.4818267822265625, 0.565673828125, 0.6495208740234375, 0.733367919921875, 0.8172149658203125, 0.90106201171875, 0.9849090576171875, 1.068756103515625, 1.1526031494140625, 1.2364501953125, 1.3202972412109375, 1.404144287109375, 1.4879913330078125, 1.57183837890625, 1.6556854248046875, 1.739532470703125, 1.8233795166015625, 1.9072265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 8.0, 3.0, 7.0, 13.0, 13.0, 19.0, 24.0, 38.0, 37.0, 72.0, 111.0, 176.0, 279.0, 479.0, 881.0, 1798.0, 3989.0, 10116.0, 30026.0, 113803.0, 700528.0, 133044.0, 33567.0, 11078.0, 4227.0, 1881.0, 920.0, 516.0, 274.0, 191.0, 121.0, 92.0, 52.0, 46.0, 41.0, 26.0, 21.0, 14.0, 10.0, 4.0, 4.0, 5.0, 1.0, 3.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.564453125, -0.5423583984375, -0.520263671875, -0.4981689453125, -0.47607421875, -0.4539794921875, -0.431884765625, -0.4097900390625, -0.3876953125, -0.3656005859375, -0.343505859375, -0.3214111328125, -0.29931640625, -0.2772216796875, -0.255126953125, -0.2330322265625, -0.2109375, -0.1888427734375, -0.166748046875, -0.1446533203125, -0.12255859375, -0.1004638671875, -0.078369140625, -0.0562744140625, -0.0341796875, -0.0120849609375, 0.010009765625, 0.0321044921875, 0.05419921875, 0.0762939453125, 0.098388671875, 0.1204833984375, 0.142578125, 0.1646728515625, 0.186767578125, 0.2088623046875, 0.23095703125, 0.2530517578125, 0.275146484375, 0.2972412109375, 0.3193359375, 0.3414306640625, 0.363525390625, 0.3856201171875, 0.40771484375, 0.4298095703125, 0.451904296875, 0.4739990234375, 0.49609375, 0.5181884765625, 0.540283203125, 0.5623779296875, 0.58447265625, 0.6065673828125, 0.628662109375, 0.6507568359375, 0.6728515625, 0.6949462890625, 0.717041015625, 0.7391357421875, 0.76123046875, 0.7833251953125, 0.805419921875, 0.8275146484375, 0.849609375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 7.0, 8.0, 12.0, 7.0, 13.0, 25.0, 31.0, 46.0, 62.0, 120.0, 237.0, 160.0, 93.0, 41.0, 30.0, 18.0, 23.0, 15.0, 19.0, 7.0, 7.0, 4.0, 4.0, 4.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0003972053527832031, -0.0003872048109769821, -0.0003772042691707611, -0.0003672037273645401, -0.0003572031855583191, -0.0003472026437520981, -0.0003372021019458771, -0.00032720156013965607, -0.00031720101833343506, -0.00030720047652721405, -0.00029719993472099304, -0.00028719939291477203, -0.000277198851108551, -0.00026719830930233, -0.000257197767496109, -0.000247197225689888, -0.000237196683883667, -0.00022719614207744598, -0.00021719560027122498, -0.00020719505846500397, -0.00019719451665878296, -0.00018719397485256195, -0.00017719343304634094, -0.00016719289124011993, -0.00015719234943389893, -0.00014719180762767792, -0.0001371912658214569, -0.0001271907240152359, -0.00011719018220901489, -0.00010718964040279388, -9.718909859657288e-05, -8.718855679035187e-05, -7.718801498413086e-05, -6.718747317790985e-05, -5.718693137168884e-05, -4.7186389565467834e-05, -3.7185847759246826e-05, -2.7185305953025818e-05, -1.718476414680481e-05, -7.184222340583801e-06, 2.816319465637207e-06, 1.2816861271858215e-05, 2.2817403078079224e-05, 3.281794488430023e-05, 4.281848669052124e-05, 5.281902849674225e-05, 6.281957030296326e-05, 7.282011210918427e-05, 8.282065391540527e-05, 9.282119572162628e-05, 0.00010282173752784729, 0.0001128222793340683, 0.0001228228211402893, 0.00013282336294651031, 0.00014282390475273132, 0.00015282444655895233, 0.00016282498836517334, 0.00017282553017139435, 0.00018282607197761536, 0.00019282661378383636, 0.00020282715559005737, 0.00021282769739627838, 0.0002228282392024994, 0.0002328287810087204, 0.0002428293228149414]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 2.0, 2.0, 11.0, 14.0, 12.0, 29.0, 33.0, 67.0, 106.0, 170.0, 234.0, 416.0, 688.0, 1292.0, 2868.0, 7342.0, 23690.0, 89445.0, 675390.0, 186686.0, 40170.0, 11847.0, 4062.0, 1753.0, 849.0, 516.0, 305.0, 206.0, 119.0, 80.0, 42.0, 42.0, 19.0, 16.0, 14.0, 5.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6181640625, -0.595855712890625, -0.57354736328125, -0.551239013671875, -0.5289306640625, -0.506622314453125, -0.48431396484375, -0.462005615234375, -0.439697265625, -0.417388916015625, -0.39508056640625, -0.372772216796875, -0.3504638671875, -0.328155517578125, -0.30584716796875, -0.283538818359375, -0.26123046875, -0.238922119140625, -0.21661376953125, -0.194305419921875, -0.1719970703125, -0.149688720703125, -0.12738037109375, -0.105072021484375, -0.082763671875, -0.060455322265625, -0.03814697265625, -0.015838623046875, 0.0064697265625, 0.028778076171875, 0.05108642578125, 0.073394775390625, 0.095703125, 0.118011474609375, 0.14031982421875, 0.162628173828125, 0.1849365234375, 0.207244873046875, 0.22955322265625, 0.251861572265625, 0.274169921875, 0.296478271484375, 0.31878662109375, 0.341094970703125, 0.3634033203125, 0.385711669921875, 0.40802001953125, 0.430328369140625, 0.45263671875, 0.474945068359375, 0.49725341796875, 0.519561767578125, 0.5418701171875, 0.564178466796875, 0.58648681640625, 0.608795166015625, 0.631103515625, 0.653411865234375, 0.67572021484375, 0.698028564453125, 0.7203369140625, 0.742645263671875, 0.76495361328125, 0.787261962890625, 0.8095703125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 4.0, 4.0, 7.0, 10.0, 9.0, 11.0, 8.0, 15.0, 14.0, 16.0, 20.0, 37.0, 52.0, 48.0, 64.0, 85.0, 105.0, 110.0, 86.0, 72.0, 36.0, 35.0, 30.0, 25.0, 15.0, 15.0, 11.0, 11.0, 11.0, 4.0, 5.0, 6.0, 8.0, 3.0, 2.0, 3.0, 0.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.79345703125, -0.7712860107421875, -0.749114990234375, -0.7269439697265625, -0.70477294921875, -0.6826019287109375, -0.660430908203125, -0.6382598876953125, -0.6160888671875, -0.5939178466796875, -0.571746826171875, -0.5495758056640625, -0.52740478515625, -0.5052337646484375, -0.483062744140625, -0.4608917236328125, -0.438720703125, -0.4165496826171875, -0.394378662109375, -0.3722076416015625, -0.35003662109375, -0.3278656005859375, -0.305694580078125, -0.2835235595703125, -0.2613525390625, -0.2391815185546875, -0.217010498046875, -0.1948394775390625, -0.17266845703125, -0.1504974365234375, -0.128326416015625, -0.1061553955078125, -0.083984375, -0.0618133544921875, -0.039642333984375, -0.0174713134765625, 0.00469970703125, 0.0268707275390625, 0.049041748046875, 0.0712127685546875, 0.0933837890625, 0.1155548095703125, 0.137725830078125, 0.1598968505859375, 0.18206787109375, 0.2042388916015625, 0.226409912109375, 0.2485809326171875, 0.270751953125, 0.2929229736328125, 0.315093994140625, 0.3372650146484375, 0.35943603515625, 0.3816070556640625, 0.403778076171875, 0.4259490966796875, 0.4481201171875, 0.4702911376953125, 0.492462158203125, 0.5146331787109375, 0.53680419921875, 0.5589752197265625, 0.581146240234375, 0.6033172607421875, 0.62548828125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 6.0, 13.0, 32.0, 62.0, 149.0, 279.0, 216.0, 102.0, 62.0, 22.0, 11.0, 11.0, 9.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.805953979492188, -15.294174194335938, -14.782393455505371, -14.270613670349121, -13.758832931518555, -13.247053146362305, -12.735273361206055, -12.223492622375488, -11.711711883544922, -11.199932098388672, -10.688151359558105, -10.176371574401855, -9.664590835571289, -9.152811050415039, -8.641031265258789, -8.129250526428223, -7.617470741271973, -7.1056904792785645, -6.593910217285156, -6.082130432128906, -5.57034969329834, -5.05856990814209, -4.546789646148682, -4.035009384155273, -3.5232291221618652, -3.011448860168457, -2.499668598175049, -1.9878885746002197, -1.4761083126068115, -0.9643280506134033, -0.4525480270385742, 0.059232234954833984, 0.5710124969482422, 1.0827927589416504, 1.594572901725769, 2.1063530445098877, 2.618133306503296, 3.129913568496704, 3.641693592071533, 4.153473854064941, 4.66525411605835, 5.177034378051758, 5.688814640045166, 6.200594902038574, 6.712374687194824, 7.224155426025391, 7.735935211181641, 8.24771499633789, 8.759495735168457, 9.271275520324707, 9.783056259155273, 10.294836044311523, 10.80661678314209, 11.31839656829834, 11.830177307128906, 12.341957092285156, 12.853736877441406, 13.365516662597656, 13.877297401428223, 14.389077186584473, 14.900857925415039, 15.412637710571289, 15.924417495727539, 16.436199188232422, 16.947978973388672]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 9.0, 9.0, 13.0, 21.0, 18.0, 20.0, 15.0, 18.0, 31.0, 36.0, 39.0, 33.0, 48.0, 59.0, 69.0, 74.0, 73.0, 54.0, 46.0, 31.0, 34.0, 46.0, 23.0, 26.0, 21.0, 17.0, 18.0, 16.0, 11.0, 15.0, 11.0, 10.0, 6.0, 4.0, 4.0, 1.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-10.99305248260498, -10.655808448791504, -10.318565368652344, -9.981321334838867, -9.64407730102539, -9.30683422088623, -8.969590187072754, -8.632347106933594, -8.295103073120117, -7.957859516143799, -7.6206159591674805, -7.283371925354004, -6.9461283683776855, -6.608884811401367, -6.271640777587891, -5.934397220611572, -5.597153663635254, -5.2599101066589355, -4.922666549682617, -4.585422515869141, -4.248178958892822, -3.910935401916504, -3.5736916065216064, -3.236447811126709, -2.8992042541503906, -2.5619606971740723, -2.224716901779175, -1.887473225593567, -1.550229549407959, -1.212985873222351, -0.8757421970367432, -0.5384984016418457, -0.20125579833984375, 0.13598787784576416, 0.47323155403137207, 0.81047523021698, 1.147718906402588, 1.4849625825881958, 1.8222062587738037, 2.159450054168701, 2.4966936111450195, 2.833937168121338, 3.1711809635162354, 3.508424758911133, 3.845668315887451, 4.1829118728637695, 4.520155906677246, 4.8573994636535645, 5.194643020629883, 5.531886577606201, 5.8691301345825195, 6.206374168395996, 6.5436177253723145, 6.880861282348633, 7.218105316162109, 7.555348873138428, 7.892592430114746, 8.229836463928223, 8.567079544067383, 8.90432357788086, 9.241567611694336, 9.578810691833496, 9.916054725646973, 10.253297805786133, 10.59054183959961]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 10.0, 9.0, 24.0, 28.0, 59.0, 102.0, 166.0, 333.0, 714.0, 1752.0, 5980.0, 28833.0, 358811.0, 3258574.0, 499918.0, 30250.0, 5448.0, 1699.0, 746.0, 397.0, 162.0, 98.0, 55.0, 41.0, 25.0, 12.0, 8.0, 7.0, 8.0, 7.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.2197265625, -1.1833648681640625, -1.147003173828125, -1.1106414794921875, -1.07427978515625, -1.0379180908203125, -1.001556396484375, -0.9651947021484375, -0.9288330078125, -0.8924713134765625, -0.856109619140625, -0.8197479248046875, -0.78338623046875, -0.7470245361328125, -0.710662841796875, -0.6743011474609375, -0.637939453125, -0.6015777587890625, -0.565216064453125, -0.5288543701171875, -0.49249267578125, -0.4561309814453125, -0.419769287109375, -0.3834075927734375, -0.3470458984375, -0.3106842041015625, -0.274322509765625, -0.2379608154296875, -0.20159912109375, -0.1652374267578125, -0.128875732421875, -0.0925140380859375, -0.05615234375, -0.0197906494140625, 0.016571044921875, 0.0529327392578125, 0.08929443359375, 0.1256561279296875, 0.162017822265625, 0.1983795166015625, 0.2347412109375, 0.2711029052734375, 0.307464599609375, 0.3438262939453125, 0.38018798828125, 0.4165496826171875, 0.452911376953125, 0.4892730712890625, 0.525634765625, 0.5619964599609375, 0.598358154296875, 0.6347198486328125, 0.67108154296875, 0.7074432373046875, 0.743804931640625, 0.7801666259765625, 0.8165283203125, 0.8528900146484375, 0.889251708984375, 0.9256134033203125, 0.96197509765625, 0.9983367919921875, 1.034698486328125, 1.0710601806640625, 1.107421875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 9.0, 21.0, 23.0, 27.0, 27.0, 52.0, 47.0, 60.0, 61.0, 81.0, 82.0, 84.0, 95.0, 60.0, 68.0, 38.0, 45.0, 34.0, 20.0, 17.0, 18.0, 12.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78515625, -0.7537994384765625, -0.722442626953125, -0.6910858154296875, -0.65972900390625, -0.6283721923828125, -0.597015380859375, -0.5656585693359375, -0.5343017578125, -0.5029449462890625, -0.471588134765625, -0.4402313232421875, -0.40887451171875, -0.3775177001953125, -0.346160888671875, -0.3148040771484375, -0.283447265625, -0.2520904541015625, -0.220733642578125, -0.1893768310546875, -0.15802001953125, -0.1266632080078125, -0.095306396484375, -0.0639495849609375, -0.0325927734375, -0.0012359619140625, 0.030120849609375, 0.0614776611328125, 0.09283447265625, 0.1241912841796875, 0.155548095703125, 0.1869049072265625, 0.21826171875, 0.2496185302734375, 0.280975341796875, 0.3123321533203125, 0.34368896484375, 0.3750457763671875, 0.406402587890625, 0.4377593994140625, 0.4691162109375, 0.5004730224609375, 0.531829833984375, 0.5631866455078125, 0.59454345703125, 0.6259002685546875, 0.657257080078125, 0.6886138916015625, 0.719970703125, 0.7513275146484375, 0.782684326171875, 0.8140411376953125, 0.84539794921875, 0.8767547607421875, 0.908111572265625, 0.9394683837890625, 0.9708251953125, 1.0021820068359375, 1.033538818359375, 1.0648956298828125, 1.09625244140625, 1.1276092529296875, 1.158966064453125, 1.1903228759765625, 1.2216796875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 3.0, 5.0, 8.0, 12.0, 13.0, 22.0, 33.0, 48.0, 59.0, 75.0, 131.0, 167.0, 297.0, 497.0, 889.0, 1836.0, 5865.0, 39686.0, 2774094.0, 1338687.0, 24851.0, 4013.0, 1334.0, 585.0, 334.0, 210.0, 156.0, 101.0, 71.0, 52.0, 40.0, 21.0, 20.0, 19.0, 17.0, 6.0, 8.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6435546875, -1.5825042724609375, -1.521453857421875, -1.4604034423828125, -1.39935302734375, -1.3383026123046875, -1.277252197265625, -1.2162017822265625, -1.1551513671875, -1.0941009521484375, -1.033050537109375, -0.9720001220703125, -0.91094970703125, -0.8498992919921875, -0.788848876953125, -0.7277984619140625, -0.666748046875, -0.6056976318359375, -0.544647216796875, -0.4835968017578125, -0.42254638671875, -0.3614959716796875, -0.300445556640625, -0.2393951416015625, -0.1783447265625, -0.1172943115234375, -0.056243896484375, 0.0048065185546875, 0.06585693359375, 0.1269073486328125, 0.187957763671875, 0.2490081787109375, 0.31005859375, 0.3711090087890625, 0.432159423828125, 0.4932098388671875, 0.55426025390625, 0.6153106689453125, 0.676361083984375, 0.7374114990234375, 0.7984619140625, 0.8595123291015625, 0.920562744140625, 0.9816131591796875, 1.04266357421875, 1.1037139892578125, 1.164764404296875, 1.2258148193359375, 1.286865234375, 1.3479156494140625, 1.408966064453125, 1.4700164794921875, 1.53106689453125, 1.5921173095703125, 1.653167724609375, 1.7142181396484375, 1.7752685546875, 1.8363189697265625, 1.897369384765625, 1.9584197998046875, 2.01947021484375, 2.0805206298828125, 2.141571044921875, 2.2026214599609375, 2.263671875]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 6.0, 0.0, 4.0, 5.0, 8.0, 9.0, 9.0, 24.0, 33.0, 73.0, 156.0, 346.0, 738.0, 1105.0, 826.0, 401.0, 168.0, 67.0, 36.0, 22.0, 20.0, 9.0, 7.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.216796875, -2.157989501953125, -2.09918212890625, -2.040374755859375, -1.9815673828125, -1.922760009765625, -1.86395263671875, -1.805145263671875, -1.746337890625, -1.687530517578125, -1.62872314453125, -1.569915771484375, -1.5111083984375, -1.452301025390625, -1.39349365234375, -1.334686279296875, -1.27587890625, -1.217071533203125, -1.15826416015625, -1.099456787109375, -1.0406494140625, -0.981842041015625, -0.92303466796875, -0.864227294921875, -0.805419921875, -0.746612548828125, -0.68780517578125, -0.628997802734375, -0.5701904296875, -0.511383056640625, -0.45257568359375, -0.393768310546875, -0.3349609375, -0.276153564453125, -0.21734619140625, -0.158538818359375, -0.0997314453125, -0.040924072265625, 0.01788330078125, 0.076690673828125, 0.135498046875, 0.194305419921875, 0.25311279296875, 0.311920166015625, 0.3707275390625, 0.429534912109375, 0.48834228515625, 0.547149658203125, 0.60595703125, 0.664764404296875, 0.72357177734375, 0.782379150390625, 0.8411865234375, 0.899993896484375, 0.95880126953125, 1.017608642578125, 1.076416015625, 1.135223388671875, 1.19403076171875, 1.252838134765625, 1.3116455078125, 1.370452880859375, 1.42926025390625, 1.488067626953125, 1.546875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 4.0, 7.0, 4.0, 6.0, 5.0, 18.0, 35.0, 104.0, 241.0, 301.0, 175.0, 71.0, 21.0, 8.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.064496994018555, -21.40431022644043, -20.744121551513672, -20.083934783935547, -19.423748016357422, -18.763561248779297, -18.103374481201172, -17.443185806274414, -16.78299903869629, -16.122812271118164, -15.462624549865723, -14.802436828613281, -14.142250061035156, -13.482063293457031, -12.82187557220459, -12.161687850952148, -11.501501083374023, -10.841314315795898, -10.181126594543457, -9.520938873291016, -8.86075210571289, -8.200565338134766, -7.540377616882324, -6.880190372467041, -6.220003128051758, -5.559815883636475, -4.899628639221191, -4.239441394805908, -3.579254150390625, -2.919066905975342, -2.2588796615600586, -1.5986924171447754, -0.9385032653808594, -0.27831602096557617, 0.38187122344970703, 1.0420584678649902, 1.7022457122802734, 2.3624329566955566, 3.02262020111084, 3.682807445526123, 4.342994689941406, 5.0031819343566895, 5.663369178771973, 6.323556423187256, 6.983743667602539, 7.643930912017822, 8.304118156433105, 8.964305877685547, 9.624492645263672, 10.284679412841797, 10.944867134094238, 11.60505485534668, 12.265241622924805, 12.92542839050293, 13.585616111755371, 14.245803833007812, 14.905990600585938, 15.566177368164062, 16.226364135742188, 16.886552810668945, 17.54673957824707, 18.206926345825195, 18.867115020751953, 19.527301788330078, 20.187488555908203]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 5.0, 9.0, 7.0, 15.0, 14.0, 21.0, 22.0, 22.0, 44.0, 52.0, 43.0, 66.0, 76.0, 76.0, 65.0, 68.0, 81.0, 65.0, 42.0, 55.0, 40.0, 29.0, 16.0, 25.0, 13.0, 17.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.052654266357422, -7.7853851318359375, -7.518115520477295, -7.2508463859558105, -6.983576774597168, -6.716307640075684, -6.449038505554199, -6.181769371032715, -5.914499759674072, -5.647230625152588, -5.379961013793945, -5.112691879272461, -4.845422744750977, -4.578153133392334, -4.31088399887085, -4.043614387512207, -3.7763452529907227, -3.509075880050659, -3.2418065071105957, -2.9745373725891113, -2.707267999649048, -2.4399986267089844, -2.1727294921875, -1.9054601192474365, -1.638190746307373, -1.3709213733673096, -1.1036521196365356, -0.8363828063011169, -0.5691134929656982, -0.30184412002563477, -0.03457486629486084, 0.23269438743591309, 0.49996471405029297, 0.7672340273857117, 1.0345033407211304, 1.3017725944519043, 1.5690419673919678, 1.8363113403320312, 2.1035804748535156, 2.370849847793579, 2.6381192207336426, 2.905388593673706, 3.1726579666137695, 3.439927101135254, 3.7071964740753174, 3.974465847015381, 4.241734981536865, 4.509004592895508, 4.776273727416992, 5.043542861938477, 5.310812473297119, 5.5780816078186035, 5.845351219177246, 6.1126203536987305, 6.379889488220215, 6.647158622741699, 6.914428234100342, 7.181697368621826, 7.448966979980469, 7.716236114501953, 7.9835052490234375, 8.250774383544922, 8.518044471740723, 8.785313606262207, 9.052582740783691]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 5.0, 3.0, 9.0, 11.0, 17.0, 24.0, 52.0, 60.0, 140.0, 232.0, 515.0, 1241.0, 3240.0, 10103.0, 45414.0, 273963.0, 552340.0, 127942.0, 23407.0, 6072.0, 2057.0, 859.0, 387.0, 201.0, 103.0, 57.0, 34.0, 22.0, 20.0, 11.0, 6.0, 1.0, 2.0, 5.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.208984375, -1.17034912109375, -1.1317138671875, -1.09307861328125, -1.054443359375, -1.01580810546875, -0.9771728515625, -0.93853759765625, -0.89990234375, -0.86126708984375, -0.8226318359375, -0.78399658203125, -0.745361328125, -0.70672607421875, -0.6680908203125, -0.62945556640625, -0.5908203125, -0.55218505859375, -0.5135498046875, -0.47491455078125, -0.436279296875, -0.39764404296875, -0.3590087890625, -0.32037353515625, -0.28173828125, -0.24310302734375, -0.2044677734375, -0.16583251953125, -0.127197265625, -0.08856201171875, -0.0499267578125, -0.01129150390625, 0.02734375, 0.06597900390625, 0.1046142578125, 0.14324951171875, 0.181884765625, 0.22052001953125, 0.2591552734375, 0.29779052734375, 0.33642578125, 0.37506103515625, 0.4136962890625, 0.45233154296875, 0.490966796875, 0.52960205078125, 0.5682373046875, 0.60687255859375, 0.6455078125, 0.68414306640625, 0.7227783203125, 0.76141357421875, 0.800048828125, 0.83868408203125, 0.8773193359375, 0.91595458984375, 0.95458984375, 0.99322509765625, 1.0318603515625, 1.07049560546875, 1.109130859375, 1.14776611328125, 1.1864013671875, 1.22503662109375, 1.263671875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 6.0, 10.0, 12.0, 21.0, 22.0, 32.0, 38.0, 58.0, 45.0, 75.0, 77.0, 77.0, 76.0, 74.0, 72.0, 55.0, 62.0, 50.0, 40.0, 25.0, 18.0, 17.0, 14.0, 10.0, 9.0, 5.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.84130859375, -0.8095626831054688, -0.7778167724609375, -0.7460708618164062, -0.714324951171875, -0.6825790405273438, -0.6508331298828125, -0.6190872192382812, -0.58734130859375, -0.5555953979492188, -0.5238494873046875, -0.49210357666015625, -0.460357666015625, -0.42861175537109375, -0.3968658447265625, -0.36511993408203125, -0.3333740234375, -0.30162811279296875, -0.2698822021484375, -0.23813629150390625, -0.206390380859375, -0.17464447021484375, -0.1428985595703125, -0.11115264892578125, -0.07940673828125, -0.04766082763671875, -0.0159149169921875, 0.01583099365234375, 0.047576904296875, 0.07932281494140625, 0.1110687255859375, 0.14281463623046875, 0.174560546875, 0.20630645751953125, 0.2380523681640625, 0.26979827880859375, 0.301544189453125, 0.33329010009765625, 0.3650360107421875, 0.39678192138671875, 0.42852783203125, 0.46027374267578125, 0.4920196533203125, 0.5237655639648438, 0.555511474609375, 0.5872573852539062, 0.6190032958984375, 0.6507492065429688, 0.6824951171875, 0.7142410278320312, 0.7459869384765625, 0.7777328491210938, 0.809478759765625, 0.8412246704101562, 0.8729705810546875, 0.9047164916992188, 0.93646240234375, 0.9682083129882812, 0.9999542236328125, 1.0317001342773438, 1.063446044921875, 1.0951919555664062, 1.1269378662109375, 1.1586837768554688, 1.1904296875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 5.0, 3.0, 4.0, 2.0, 6.0, 8.0, 17.0, 22.0, 26.0, 28.0, 45.0, 81.0, 157.0, 270.0, 687.0, 1860.0, 6687.0, 36185.0, 336736.0, 603699.0, 49792.0, 8536.0, 2204.0, 763.0, 331.0, 151.0, 89.0, 53.0, 39.0, 23.0, 13.0, 9.0, 10.0, 8.0, 6.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.619140625, -1.56866455078125, -1.5181884765625, -1.46771240234375, -1.417236328125, -1.36676025390625, -1.3162841796875, -1.26580810546875, -1.21533203125, -1.16485595703125, -1.1143798828125, -1.06390380859375, -1.013427734375, -0.96295166015625, -0.9124755859375, -0.86199951171875, -0.8115234375, -0.76104736328125, -0.7105712890625, -0.66009521484375, -0.609619140625, -0.55914306640625, -0.5086669921875, -0.45819091796875, -0.40771484375, -0.35723876953125, -0.3067626953125, -0.25628662109375, -0.205810546875, -0.15533447265625, -0.1048583984375, -0.05438232421875, -0.00390625, 0.04656982421875, 0.0970458984375, 0.14752197265625, 0.197998046875, 0.24847412109375, 0.2989501953125, 0.34942626953125, 0.39990234375, 0.45037841796875, 0.5008544921875, 0.55133056640625, 0.601806640625, 0.65228271484375, 0.7027587890625, 0.75323486328125, 0.8037109375, 0.85418701171875, 0.9046630859375, 0.95513916015625, 1.005615234375, 1.05609130859375, 1.1065673828125, 1.15704345703125, 1.20751953125, 1.25799560546875, 1.3084716796875, 1.35894775390625, 1.409423828125, 1.45989990234375, 1.5103759765625, 1.56085205078125, 1.611328125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 4.0, 3.0, 7.0, 10.0, 12.0, 13.0, 18.0, 24.0, 32.0, 28.0, 30.0, 25.0, 41.0, 42.0, 51.0, 59.0, 58.0, 48.0, 55.0, 49.0, 45.0, 47.0, 48.0, 34.0, 39.0, 39.0, 20.0, 28.0, 21.0, 11.0, 12.0, 9.0, 13.0, 5.0, 3.0, 6.0, 1.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.43359375, -2.35272216796875, -2.2718505859375, -2.19097900390625, -2.110107421875, -2.02923583984375, -1.9483642578125, -1.86749267578125, -1.78662109375, -1.70574951171875, -1.6248779296875, -1.54400634765625, -1.463134765625, -1.38226318359375, -1.3013916015625, -1.22052001953125, -1.1396484375, -1.05877685546875, -0.9779052734375, -0.89703369140625, -0.816162109375, -0.73529052734375, -0.6544189453125, -0.57354736328125, -0.49267578125, -0.41180419921875, -0.3309326171875, -0.25006103515625, -0.169189453125, -0.08831787109375, -0.0074462890625, 0.07342529296875, 0.154296875, 0.23516845703125, 0.3160400390625, 0.39691162109375, 0.477783203125, 0.55865478515625, 0.6395263671875, 0.72039794921875, 0.80126953125, 0.88214111328125, 0.9630126953125, 1.04388427734375, 1.124755859375, 1.20562744140625, 1.2864990234375, 1.36737060546875, 1.4482421875, 1.52911376953125, 1.6099853515625, 1.69085693359375, 1.771728515625, 1.85260009765625, 1.9334716796875, 2.01434326171875, 2.09521484375, 2.17608642578125, 2.2569580078125, 2.33782958984375, 2.418701171875, 2.49957275390625, 2.5804443359375, 2.66131591796875, 2.7421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 7.0, 4.0, 11.0, 15.0, 19.0, 30.0, 34.0, 73.0, 97.0, 138.0, 220.0, 347.0, 534.0, 918.0, 1509.0, 2508.0, 4683.0, 9777.0, 23953.0, 73251.0, 328913.0, 478452.0, 76805.0, 24704.0, 10114.0, 4816.0, 2570.0, 1542.0, 853.0, 525.0, 353.0, 250.0, 144.0, 123.0, 84.0, 55.0, 38.0, 24.0, 12.0, 17.0, 9.0, 7.0, 3.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4404296875, -0.42748260498046875, -0.4145355224609375, -0.40158843994140625, -0.388641357421875, -0.37569427490234375, -0.3627471923828125, -0.34980010986328125, -0.33685302734375, -0.32390594482421875, -0.3109588623046875, -0.29801177978515625, -0.285064697265625, -0.27211761474609375, -0.2591705322265625, -0.24622344970703125, -0.2332763671875, -0.22032928466796875, -0.2073822021484375, -0.19443511962890625, -0.181488037109375, -0.16854095458984375, -0.1555938720703125, -0.14264678955078125, -0.12969970703125, -0.11675262451171875, -0.1038055419921875, -0.09085845947265625, -0.077911376953125, -0.06496429443359375, -0.0520172119140625, -0.03907012939453125, -0.026123046875, -0.01317596435546875, -0.0002288818359375, 0.01271820068359375, 0.025665283203125, 0.03861236572265625, 0.0515594482421875, 0.06450653076171875, 0.07745361328125, 0.09040069580078125, 0.1033477783203125, 0.11629486083984375, 0.129241943359375, 0.14218902587890625, 0.1551361083984375, 0.16808319091796875, 0.1810302734375, 0.19397735595703125, 0.2069244384765625, 0.21987152099609375, 0.232818603515625, 0.24576568603515625, 0.2587127685546875, 0.27165985107421875, 0.28460693359375, 0.29755401611328125, 0.3105010986328125, 0.32344818115234375, 0.336395263671875, 0.34934234619140625, 0.3622894287109375, 0.37523651123046875, 0.38818359375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 3.0, 7.0, 4.0, 22.0, 20.0, 43.0, 68.0, 99.0, 135.0, 148.0, 128.0, 96.0, 72.0, 47.0, 26.0, 18.0, 15.0, 8.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014448165893554688, -0.00013858452439308167, -0.00013268738985061646, -0.00012679025530815125, -0.00012089312076568604, -0.00011499598622322083, -0.00010909885168075562, -0.0001032017171382904, -9.73045825958252e-05, -9.140744805335999e-05, -8.551031351089478e-05, -7.961317896842957e-05, -7.371604442596436e-05, -6.781890988349915e-05, -6.192177534103394e-05, -5.6024640798568726e-05, -5.0127506256103516e-05, -4.4230371713638306e-05, -3.8333237171173096e-05, -3.2436102628707886e-05, -2.6538968086242676e-05, -2.0641833543777466e-05, -1.4744699001312256e-05, -8.847564458847046e-06, -2.950429916381836e-06, 2.946704626083374e-06, 8.843839168548584e-06, 1.4740973711013794e-05, 2.0638108253479004e-05, 2.6535242795944214e-05, 3.2432377338409424e-05, 3.8329511880874634e-05, 4.4226646423339844e-05, 5.0123780965805054e-05, 5.6020915508270264e-05, 6.191805005073547e-05, 6.781518459320068e-05, 7.37123191356659e-05, 7.96094536781311e-05, 8.550658822059631e-05, 9.140372276306152e-05, 9.730085730552673e-05, 0.00010319799184799194, 0.00010909512639045715, 0.00011499226093292236, 0.00012088939547538757, 0.00012678653001785278, 0.000132683664560318, 0.0001385807991027832, 0.0001444779336452484, 0.00015037506818771362, 0.00015627220273017883, 0.00016216933727264404, 0.00016806647181510925, 0.00017396360635757446, 0.00017986074090003967, 0.00018575787544250488, 0.0001916550099849701, 0.0001975521445274353, 0.0002034492790699005, 0.00020934641361236572, 0.00021524354815483093, 0.00022114068269729614, 0.00022703781723976135, 0.00023293495178222656]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 11.0, 2.0, 8.0, 12.0, 27.0, 30.0, 62.0, 93.0, 205.0, 416.0, 917.0, 2073.0, 5704.0, 17141.0, 70970.0, 586793.0, 292936.0, 50098.0, 13293.0, 4482.0, 1752.0, 748.0, 338.0, 177.0, 100.0, 59.0, 39.0, 28.0, 12.0, 10.0, 8.0, 2.0, 3.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.56640625, -0.54864501953125, -0.5308837890625, -0.51312255859375, -0.495361328125, -0.47760009765625, -0.4598388671875, -0.44207763671875, -0.42431640625, -0.40655517578125, -0.3887939453125, -0.37103271484375, -0.353271484375, -0.33551025390625, -0.3177490234375, -0.29998779296875, -0.2822265625, -0.26446533203125, -0.2467041015625, -0.22894287109375, -0.211181640625, -0.19342041015625, -0.1756591796875, -0.15789794921875, -0.14013671875, -0.12237548828125, -0.1046142578125, -0.08685302734375, -0.069091796875, -0.05133056640625, -0.0335693359375, -0.01580810546875, 0.001953125, 0.01971435546875, 0.0374755859375, 0.05523681640625, 0.072998046875, 0.09075927734375, 0.1085205078125, 0.12628173828125, 0.14404296875, 0.16180419921875, 0.1795654296875, 0.19732666015625, 0.215087890625, 0.23284912109375, 0.2506103515625, 0.26837158203125, 0.2861328125, 0.30389404296875, 0.3216552734375, 0.33941650390625, 0.357177734375, 0.37493896484375, 0.3927001953125, 0.41046142578125, 0.42822265625, 0.44598388671875, 0.4637451171875, 0.48150634765625, 0.499267578125, 0.51702880859375, 0.5347900390625, 0.55255126953125, 0.5703125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 6.0, 0.0, 3.0, 3.0, 2.0, 4.0, 5.0, 11.0, 8.0, 21.0, 21.0, 27.0, 30.0, 54.0, 65.0, 85.0, 103.0, 96.0, 98.0, 99.0, 63.0, 60.0, 43.0, 27.0, 16.0, 17.0, 13.0, 9.0, 3.0, 7.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62060546875, -0.6009597778320312, -0.5813140869140625, -0.5616683959960938, -0.542022705078125, -0.5223770141601562, -0.5027313232421875, -0.48308563232421875, -0.46343994140625, -0.44379425048828125, -0.4241485595703125, -0.40450286865234375, -0.384857177734375, -0.36521148681640625, -0.3455657958984375, -0.32592010498046875, -0.3062744140625, -0.28662872314453125, -0.2669830322265625, -0.24733734130859375, -0.227691650390625, -0.20804595947265625, -0.1884002685546875, -0.16875457763671875, -0.14910888671875, -0.12946319580078125, -0.1098175048828125, -0.09017181396484375, -0.070526123046875, -0.05088043212890625, -0.0312347412109375, -0.01158905029296875, 0.008056640625, 0.02770233154296875, 0.0473480224609375, 0.06699371337890625, 0.086639404296875, 0.10628509521484375, 0.1259307861328125, 0.14557647705078125, 0.16522216796875, 0.18486785888671875, 0.2045135498046875, 0.22415924072265625, 0.243804931640625, 0.26345062255859375, 0.2830963134765625, 0.30274200439453125, 0.3223876953125, 0.34203338623046875, 0.3616790771484375, 0.38132476806640625, 0.400970458984375, 0.42061614990234375, 0.4402618408203125, 0.45990753173828125, 0.47955322265625, 0.49919891357421875, 0.5188446044921875, 0.5384902954101562, 0.558135986328125, 0.5777816772460938, 0.5974273681640625, 0.6170730590820312, 0.63671875]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 6.0, 5.0, 7.0, 15.0, 36.0, 47.0, 101.0, 150.0, 259.0, 153.0, 92.0, 47.0, 32.0, 20.0, 9.0, 6.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.970185279846191, -12.625527381896973, -12.28087043762207, -11.936212539672852, -11.591554641723633, -11.246896743774414, -10.902239799499512, -10.557581901550293, -10.21292495727539, -9.868267059326172, -9.52361011505127, -9.17895221710205, -8.834294319152832, -8.48963737487793, -8.144979476928711, -7.800321578979492, -7.455663681030273, -7.111006259918213, -6.766348361968994, -6.421690940856934, -6.077033042907715, -5.732375621795654, -5.387718200683594, -5.043060302734375, -4.6984028816223145, -4.353745460510254, -4.009087562561035, -3.6644301414489746, -3.319772481918335, -2.9751148223876953, -2.6304574012756348, -2.285799741744995, -1.9411430358886719, -1.5964853763580322, -1.2518278360366821, -0.907170295715332, -0.5625126361846924, -0.21785497665405273, 0.1268024444580078, 0.47146010398864746, 0.8161177635192871, 1.1607754230499268, 1.5054329633712769, 1.850090503692627, 2.1947481632232666, 2.5394058227539062, 2.884063243865967, 3.2287209033966064, 3.573378562927246, 3.9180362224578857, 4.262693881988525, 4.607351303100586, 4.952009201049805, 5.296666622161865, 5.641324043273926, 5.9859819412231445, 6.330639362335205, 6.675296783447266, 7.019954681396484, 7.364612102508545, 7.7092695236206055, 8.053927421569824, 8.398584365844727, 8.743242263793945, 9.087900161743164]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 10.0, 15.0, 17.0, 23.0, 21.0, 27.0, 30.0, 42.0, 51.0, 59.0, 60.0, 94.0, 106.0, 80.0, 65.0, 46.0, 39.0, 28.0, 30.0, 27.0, 23.0, 21.0, 19.0, 15.0, 10.0, 6.0, 8.0, 8.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.64122486114502, -13.284805297851562, -12.928386688232422, -12.571967124938965, -12.215548515319824, -11.859128952026367, -11.502710342407227, -11.14629077911377, -10.789871215820312, -10.433451652526855, -10.077033042907715, -9.720613479614258, -9.364194869995117, -9.00777530670166, -8.651355743408203, -8.294937133789062, -7.938518524169922, -7.582099437713623, -7.225680351257324, -6.869260787963867, -6.512842178344727, -6.1564226150512695, -5.800003528594971, -5.443584442138672, -5.087165355682373, -4.730746269226074, -4.374327182769775, -4.017908096313477, -3.6614887714385986, -3.3050696849823, -2.948650360107422, -2.592231273651123, -2.2358131408691406, -1.8793940544128418, -1.5229748487472534, -1.166555643081665, -0.8101365566253662, -0.4537174701690674, -0.09729814529418945, 0.2591209411621094, 0.6155400276184082, 0.9719591736793518, 1.3283783197402954, 1.6847975254058838, 2.0412166118621826, 2.3976356983184814, 2.7540550231933594, 3.110474109649658, 3.466893196105957, 3.823312282562256, 4.179731369018555, 4.536150932312012, 4.892569541931152, 5.248989105224609, 5.605408191680908, 5.961827278137207, 6.318246364593506, 6.674665451049805, 7.0310845375061035, 7.387503623962402, 7.743923187255859, 8.100341796875, 8.456761360168457, 8.813180923461914, 9.169599533081055]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 5.0, 15.0, 9.0, 23.0, 21.0, 44.0, 43.0, 80.0, 109.0, 152.0, 276.0, 522.0, 885.0, 1900.0, 4244.0, 10962.0, 34231.0, 159452.0, 1124853.0, 2289292.0, 464373.0, 72967.0, 17922.0, 6118.0, 2590.0, 1315.0, 674.0, 388.0, 269.0, 165.0, 102.0, 64.0, 53.0, 49.0, 36.0, 18.0, 13.0, 13.0, 10.0, 3.0, 5.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.6806640625, -0.6588973999023438, -0.6371307373046875, -0.6153640747070312, -0.593597412109375, -0.5718307495117188, -0.5500640869140625, -0.5282974243164062, -0.50653076171875, -0.48476409912109375, -0.4629974365234375, -0.44123077392578125, -0.419464111328125, -0.39769744873046875, -0.3759307861328125, -0.35416412353515625, -0.3323974609375, -0.31063079833984375, -0.2888641357421875, -0.26709747314453125, -0.245330810546875, -0.22356414794921875, -0.2017974853515625, -0.18003082275390625, -0.15826416015625, -0.13649749755859375, -0.1147308349609375, -0.09296417236328125, -0.071197509765625, -0.04943084716796875, -0.0276641845703125, -0.00589752197265625, 0.015869140625, 0.03763580322265625, 0.0594024658203125, 0.08116912841796875, 0.102935791015625, 0.12470245361328125, 0.1464691162109375, 0.16823577880859375, 0.19000244140625, 0.21176910400390625, 0.2335357666015625, 0.25530242919921875, 0.277069091796875, 0.29883575439453125, 0.3206024169921875, 0.34236907958984375, 0.3641357421875, 0.38590240478515625, 0.4076690673828125, 0.42943572998046875, 0.451202392578125, 0.47296905517578125, 0.4947357177734375, 0.5165023803710938, 0.53826904296875, 0.5600357055664062, 0.5818023681640625, 0.6035690307617188, 0.625335693359375, 0.6471023559570312, 0.6688690185546875, 0.6906356811523438, 0.71240234375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 8.0, 8.0, 3.0, 5.0, 20.0, 27.0, 23.0, 39.0, 57.0, 53.0, 70.0, 64.0, 78.0, 71.0, 69.0, 86.0, 69.0, 63.0, 53.0, 40.0, 29.0, 24.0, 17.0, 11.0, 7.0, 6.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81689453125, -0.7862319946289062, -0.7555694580078125, -0.7249069213867188, -0.694244384765625, -0.6635818481445312, -0.6329193115234375, -0.6022567749023438, -0.57159423828125, -0.5409317016601562, -0.5102691650390625, -0.47960662841796875, -0.448944091796875, -0.41828155517578125, -0.3876190185546875, -0.35695648193359375, -0.3262939453125, -0.29563140869140625, -0.2649688720703125, -0.23430633544921875, -0.203643798828125, -0.17298126220703125, -0.1423187255859375, -0.11165618896484375, -0.08099365234375, -0.05033111572265625, -0.0196685791015625, 0.01099395751953125, 0.041656494140625, 0.07231903076171875, 0.1029815673828125, 0.13364410400390625, 0.164306640625, 0.19496917724609375, 0.2256317138671875, 0.25629425048828125, 0.286956787109375, 0.31761932373046875, 0.3482818603515625, 0.37894439697265625, 0.40960693359375, 0.44026947021484375, 0.4709320068359375, 0.5015945434570312, 0.532257080078125, 0.5629196166992188, 0.5935821533203125, 0.6242446899414062, 0.6549072265625, 0.6855697631835938, 0.7162322998046875, 0.7468948364257812, 0.777557373046875, 0.8082199096679688, 0.8388824462890625, 0.8695449829101562, 0.90020751953125, 0.9308700561523438, 0.9615325927734375, 0.9921951293945312, 1.022857666015625, 1.0535202026367188, 1.0841827392578125, 1.1148452758789062, 1.1455078125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 3.0, 8.0, 10.0, 18.0, 41.0, 47.0, 72.0, 115.0, 222.0, 378.0, 824.0, 2442.0, 14720.0, 500994.0, 3612383.0, 54657.0, 4860.0, 1270.0, 470.0, 294.0, 161.0, 85.0, 70.0, 42.0, 28.0, 23.0, 12.0, 11.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6630859375, -1.5971832275390625, -1.531280517578125, -1.4653778076171875, -1.39947509765625, -1.3335723876953125, -1.267669677734375, -1.2017669677734375, -1.1358642578125, -1.0699615478515625, -1.004058837890625, -0.9381561279296875, -0.87225341796875, -0.8063507080078125, -0.740447998046875, -0.6745452880859375, -0.608642578125, -0.5427398681640625, -0.476837158203125, -0.4109344482421875, -0.34503173828125, -0.2791290283203125, -0.213226318359375, -0.1473236083984375, -0.0814208984375, -0.0155181884765625, 0.050384521484375, 0.1162872314453125, 0.18218994140625, 0.2480926513671875, 0.313995361328125, 0.3798980712890625, 0.44580078125, 0.5117034912109375, 0.577606201171875, 0.6435089111328125, 0.70941162109375, 0.7753143310546875, 0.841217041015625, 0.9071197509765625, 0.9730224609375, 1.0389251708984375, 1.104827880859375, 1.1707305908203125, 1.23663330078125, 1.3025360107421875, 1.368438720703125, 1.4343414306640625, 1.500244140625, 1.5661468505859375, 1.632049560546875, 1.6979522705078125, 1.76385498046875, 1.8297576904296875, 1.895660400390625, 1.9615631103515625, 2.0274658203125, 2.0933685302734375, 2.159271240234375, 2.2251739501953125, 2.29107666015625, 2.3569793701171875, 2.422882080078125, 2.4887847900390625, 2.5546875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 6.0, 7.0, 14.0, 24.0, 38.0, 68.0, 92.0, 174.0, 321.0, 575.0, 897.0, 753.0, 471.0, 287.0, 122.0, 75.0, 54.0, 32.0, 15.0, 15.0, 11.0, 6.0, 2.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.19140625, -1.1453857421875, -1.099365234375, -1.0533447265625, -1.00732421875, -0.9613037109375, -0.915283203125, -0.8692626953125, -0.8232421875, -0.7772216796875, -0.731201171875, -0.6851806640625, -0.63916015625, -0.5931396484375, -0.547119140625, -0.5010986328125, -0.455078125, -0.4090576171875, -0.363037109375, -0.3170166015625, -0.27099609375, -0.2249755859375, -0.178955078125, -0.1329345703125, -0.0869140625, -0.0408935546875, 0.005126953125, 0.0511474609375, 0.09716796875, 0.1431884765625, 0.189208984375, 0.2352294921875, 0.28125, 0.3272705078125, 0.373291015625, 0.4193115234375, 0.46533203125, 0.5113525390625, 0.557373046875, 0.6033935546875, 0.6494140625, 0.6954345703125, 0.741455078125, 0.7874755859375, 0.83349609375, 0.8795166015625, 0.925537109375, 0.9715576171875, 1.017578125, 1.0635986328125, 1.109619140625, 1.1556396484375, 1.20166015625, 1.2476806640625, 1.293701171875, 1.3397216796875, 1.3857421875, 1.4317626953125, 1.477783203125, 1.5238037109375, 1.56982421875, 1.6158447265625, 1.661865234375, 1.7078857421875, 1.75390625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 9.0, 17.0, 38.0, 84.0, 150.0, 227.0, 197.0, 131.0, 60.0, 36.0, 22.0, 11.0, 4.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.440969467163086, -13.988790512084961, -13.536611557006836, -13.084432601928711, -12.63225269317627, -12.180073738098145, -11.72789478302002, -11.275715827941895, -10.823535919189453, -10.371356964111328, -9.919178009033203, -9.466999053955078, -9.014819145202637, -8.562640190124512, -8.110461235046387, -7.658282279968262, -7.206103324890137, -6.753924369812012, -6.3017449378967285, -5.8495659828186035, -5.39738655090332, -4.945207595825195, -4.49302864074707, -4.040849685668945, -3.588670253753662, -3.136491060256958, -2.684311866760254, -2.232132911682129, -1.7799537181854248, -1.3277745246887207, -0.8755955696105957, -0.4234163761138916, 0.028763771057128906, 0.48094290494918823, 0.9331220388412476, 1.385301113128662, 1.8374803066253662, 2.2896595001220703, 2.7418384552001953, 3.1940176486968994, 3.6461968421936035, 4.0983757972717285, 4.550555229187012, 5.002734184265137, 5.454913139343262, 5.907092571258545, 6.35927152633667, 6.811450958251953, 7.263629913330078, 7.715808868408203, 8.167987823486328, 8.620166778564453, 9.072346687316895, 9.52452564239502, 9.976704597473145, 10.42888355255127, 10.881063461303711, 11.333242416381836, 11.785421371459961, 12.237600326538086, 12.689780235290527, 13.141959190368652, 13.594138145446777, 14.046317100524902, 14.498496055603027]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 4.0, 10.0, 10.0, 11.0, 12.0, 8.0, 9.0, 16.0, 23.0, 26.0, 37.0, 21.0, 26.0, 38.0, 26.0, 44.0, 42.0, 48.0, 61.0, 41.0, 41.0, 49.0, 49.0, 34.0, 40.0, 37.0, 35.0, 24.0, 27.0, 13.0, 26.0, 29.0, 13.0, 9.0, 10.0, 8.0, 10.0, 10.0, 6.0, 3.0, 6.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.305628776550293, -5.149790287017822, -4.993951320648193, -4.838112831115723, -4.682273864746094, -4.526435375213623, -4.370596408843994, -4.214757919311523, -4.0589189529418945, -3.9030802249908447, -3.747241497039795, -3.591402769088745, -3.4355640411376953, -3.2797255516052246, -3.123886823654175, -2.968048095703125, -2.8122096061706543, -2.6563708782196045, -2.5005321502685547, -2.344693422317505, -2.188854694366455, -2.0330162048339844, -1.8771774768829346, -1.7213387489318848, -1.565500020980835, -1.4096612930297852, -1.2538225650787354, -1.097983956336975, -0.9421452283859253, -0.7863065004348755, -0.6304678320884705, -0.47462916374206543, -0.3187899589538574, -0.16295126080513, -0.007112562656402588, 0.14872613549232483, 0.30456483364105225, 0.46040356159210205, 0.6162422299385071, 0.7720808982849121, 0.9279196262359619, 1.0837583541870117, 1.2395970821380615, 1.3954356908798218, 1.5512744188308716, 1.7071131467819214, 1.8629517555236816, 2.0187904834747314, 2.1746292114257812, 2.330467939376831, 2.486306667327881, 2.6421453952789307, 2.7979841232299805, 2.953822612762451, 3.109661340713501, 3.265500068664551, 3.4213387966156006, 3.5771775245666504, 3.7330162525177, 3.88885498046875, 4.044693470001221, 4.20053243637085, 4.35637092590332, 4.512209892272949, 4.66804838180542]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 3.0, 9.0, 5.0, 13.0, 14.0, 22.0, 34.0, 54.0, 95.0, 152.0, 269.0, 514.0, 921.0, 2223.0, 5999.0, 18701.0, 74176.0, 345766.0, 455191.0, 105970.0, 25520.0, 7638.0, 2745.0, 1209.0, 581.0, 314.0, 172.0, 99.0, 51.0, 36.0, 24.0, 16.0, 10.0, 6.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85595703125, -0.8243942260742188, -0.7928314208984375, -0.7612686157226562, -0.729705810546875, -0.6981430053710938, -0.6665802001953125, -0.6350173950195312, -0.60345458984375, -0.5718917846679688, -0.5403289794921875, -0.5087661743164062, -0.477203369140625, -0.44564056396484375, -0.4140777587890625, -0.38251495361328125, -0.3509521484375, -0.31938934326171875, -0.2878265380859375, -0.25626373291015625, -0.224700927734375, -0.19313812255859375, -0.1615753173828125, -0.13001251220703125, -0.09844970703125, -0.06688690185546875, -0.0353240966796875, -0.00376129150390625, 0.027801513671875, 0.05936431884765625, 0.0909271240234375, 0.12248992919921875, 0.154052734375, 0.18561553955078125, 0.2171783447265625, 0.24874114990234375, 0.280303955078125, 0.31186676025390625, 0.3434295654296875, 0.37499237060546875, 0.40655517578125, 0.43811798095703125, 0.4696807861328125, 0.5012435913085938, 0.532806396484375, 0.5643692016601562, 0.5959320068359375, 0.6274948120117188, 0.6590576171875, 0.6906204223632812, 0.7221832275390625, 0.7537460327148438, 0.785308837890625, 0.8168716430664062, 0.8484344482421875, 0.8799972534179688, 0.91156005859375, 0.9431228637695312, 0.9746856689453125, 1.0062484741210938, 1.037811279296875, 1.0693740844726562, 1.1009368896484375, 1.1324996948242188, 1.1640625]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 6.0, 6.0, 10.0, 14.0, 19.0, 22.0, 34.0, 39.0, 42.0, 50.0, 66.0, 67.0, 72.0, 71.0, 67.0, 94.0, 52.0, 55.0, 55.0, 45.0, 39.0, 23.0, 25.0, 14.0, 6.0, 2.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83740234375, -0.8071060180664062, -0.7768096923828125, -0.7465133666992188, -0.716217041015625, -0.6859207153320312, -0.6556243896484375, -0.6253280639648438, -0.59503173828125, -0.5647354125976562, -0.5344390869140625, -0.5041427612304688, -0.473846435546875, -0.44355010986328125, -0.4132537841796875, -0.38295745849609375, -0.3526611328125, -0.32236480712890625, -0.2920684814453125, -0.26177215576171875, -0.231475830078125, -0.20117950439453125, -0.1708831787109375, -0.14058685302734375, -0.11029052734375, -0.07999420166015625, -0.0496978759765625, -0.01940155029296875, 0.010894775390625, 0.04119110107421875, 0.0714874267578125, 0.10178375244140625, 0.132080078125, 0.16237640380859375, 0.1926727294921875, 0.22296905517578125, 0.253265380859375, 0.28356170654296875, 0.3138580322265625, 0.34415435791015625, 0.37445068359375, 0.40474700927734375, 0.4350433349609375, 0.46533966064453125, 0.495635986328125, 0.5259323120117188, 0.5562286376953125, 0.5865249633789062, 0.6168212890625, 0.6471176147460938, 0.6774139404296875, 0.7077102661132812, 0.738006591796875, 0.7683029174804688, 0.7985992431640625, 0.8288955688476562, 0.85919189453125, 0.8894882202148438, 0.9197845458984375, 0.9500808715820312, 0.980377197265625, 1.0106735229492188, 1.0409698486328125, 1.0712661743164062, 1.1015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 16.0, 24.0, 40.0, 87.0, 168.0, 428.0, 1270.0, 7055.0, 195892.0, 821695.0, 18702.0, 2104.0, 586.0, 259.0, 114.0, 60.0, 27.0, 22.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.619140625, -2.5323486328125, -2.445556640625, -2.3587646484375, -2.27197265625, -2.1851806640625, -2.098388671875, -2.0115966796875, -1.9248046875, -1.8380126953125, -1.751220703125, -1.6644287109375, -1.57763671875, -1.4908447265625, -1.404052734375, -1.3172607421875, -1.23046875, -1.1436767578125, -1.056884765625, -0.9700927734375, -0.88330078125, -0.7965087890625, -0.709716796875, -0.6229248046875, -0.5361328125, -0.4493408203125, -0.362548828125, -0.2757568359375, -0.18896484375, -0.1021728515625, -0.015380859375, 0.0714111328125, 0.158203125, 0.2449951171875, 0.331787109375, 0.4185791015625, 0.50537109375, 0.5921630859375, 0.678955078125, 0.7657470703125, 0.8525390625, 0.9393310546875, 1.026123046875, 1.1129150390625, 1.19970703125, 1.2864990234375, 1.373291015625, 1.4600830078125, 1.546875, 1.6336669921875, 1.720458984375, 1.8072509765625, 1.89404296875, 1.9808349609375, 2.067626953125, 2.1544189453125, 2.2412109375, 2.3280029296875, 2.414794921875, 2.5015869140625, 2.58837890625, 2.6751708984375, 2.761962890625, 2.8487548828125, 2.935546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 2.0, 7.0, 5.0, 6.0, 16.0, 9.0, 21.0, 15.0, 17.0, 29.0, 24.0, 41.0, 42.0, 42.0, 49.0, 42.0, 58.0, 71.0, 56.0, 49.0, 45.0, 35.0, 51.0, 32.0, 37.0, 33.0, 27.0, 18.0, 20.0, 19.0, 22.0, 12.0, 9.0, 10.0, 2.0, 8.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.161651611328125, -2.08892822265625, -2.016204833984375, -1.9434814453125, -1.870758056640625, -1.79803466796875, -1.725311279296875, -1.652587890625, -1.579864501953125, -1.50714111328125, -1.434417724609375, -1.3616943359375, -1.288970947265625, -1.21624755859375, -1.143524169921875, -1.07080078125, -0.998077392578125, -0.92535400390625, -0.852630615234375, -0.7799072265625, -0.707183837890625, -0.63446044921875, -0.561737060546875, -0.489013671875, -0.416290283203125, -0.34356689453125, -0.270843505859375, -0.1981201171875, -0.125396728515625, -0.05267333984375, 0.020050048828125, 0.0927734375, 0.165496826171875, 0.23822021484375, 0.310943603515625, 0.3836669921875, 0.456390380859375, 0.52911376953125, 0.601837158203125, 0.674560546875, 0.747283935546875, 0.82000732421875, 0.892730712890625, 0.9654541015625, 1.038177490234375, 1.11090087890625, 1.183624267578125, 1.25634765625, 1.329071044921875, 1.40179443359375, 1.474517822265625, 1.5472412109375, 1.619964599609375, 1.69268798828125, 1.765411376953125, 1.838134765625, 1.910858154296875, 1.98358154296875, 2.056304931640625, 2.1290283203125, 2.201751708984375, 2.27447509765625, 2.347198486328125, 2.419921875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 8.0, 16.0, 24.0, 29.0, 66.0, 94.0, 172.0, 343.0, 717.0, 1682.0, 3934.0, 11640.0, 41909.0, 223032.0, 671676.0, 66639.0, 17045.0, 5522.0, 2077.0, 953.0, 428.0, 230.0, 111.0, 70.0, 46.0, 30.0, 28.0, 12.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59619140625, -0.5750198364257812, -0.5538482666015625, -0.5326766967773438, -0.511505126953125, -0.49033355712890625, -0.4691619873046875, -0.44799041748046875, -0.42681884765625, -0.40564727783203125, -0.3844757080078125, -0.36330413818359375, -0.342132568359375, -0.32096099853515625, -0.2997894287109375, -0.27861785888671875, -0.2574462890625, -0.23627471923828125, -0.2151031494140625, -0.19393157958984375, -0.172760009765625, -0.15158843994140625, -0.1304168701171875, -0.10924530029296875, -0.08807373046875, -0.06690216064453125, -0.0457305908203125, -0.02455902099609375, -0.003387451171875, 0.01778411865234375, 0.0389556884765625, 0.06012725830078125, 0.081298828125, 0.10247039794921875, 0.1236419677734375, 0.14481353759765625, 0.165985107421875, 0.18715667724609375, 0.2083282470703125, 0.22949981689453125, 0.25067138671875, 0.27184295654296875, 0.2930145263671875, 0.31418609619140625, 0.335357666015625, 0.35652923583984375, 0.3777008056640625, 0.39887237548828125, 0.4200439453125, 0.44121551513671875, 0.4623870849609375, 0.48355865478515625, 0.504730224609375, 0.5259017944335938, 0.5470733642578125, 0.5682449340820312, 0.58941650390625, 0.6105880737304688, 0.6317596435546875, 0.6529312133789062, 0.674102783203125, 0.6952743530273438, 0.7164459228515625, 0.7376174926757812, 0.7587890625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 6.0, 5.0, 5.0, 7.0, 3.0, 8.0, 6.0, 18.0, 19.0, 26.0, 48.0, 44.0, 88.0, 135.0, 185.0, 121.0, 73.0, 56.0, 49.0, 23.0, 19.0, 17.0, 7.0, 10.0, 8.0, 4.0, 4.0, 6.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002276897430419922, -0.0002216137945652008, -0.00021553784608840942, -0.00020946189761161804, -0.00020338594913482666, -0.00019731000065803528, -0.0001912340521812439, -0.00018515810370445251, -0.00017908215522766113, -0.00017300620675086975, -0.00016693025827407837, -0.000160854309797287, -0.0001547783613204956, -0.00014870241284370422, -0.00014262646436691284, -0.00013655051589012146, -0.00013047456741333008, -0.0001243986189365387, -0.00011832267045974731, -0.00011224672198295593, -0.00010617077350616455, -0.00010009482502937317, -9.401887655258179e-05, -8.79429280757904e-05, -8.186697959899902e-05, -7.579103112220764e-05, -6.971508264541626e-05, -6.363913416862488e-05, -5.7563185691833496e-05, -5.1487237215042114e-05, -4.541128873825073e-05, -3.933534026145935e-05, -3.325939178466797e-05, -2.7183443307876587e-05, -2.1107494831085205e-05, -1.5031546354293823e-05, -8.955597877502441e-06, -2.8796494007110596e-06, 3.1962990760803223e-06, 9.272247552871704e-06, 1.5348196029663086e-05, 2.1424144506454468e-05, 2.750009298324585e-05, 3.357604146003723e-05, 3.965198993682861e-05, 4.5727938413619995e-05, 5.180388689041138e-05, 5.787983536720276e-05, 6.395578384399414e-05, 7.003173232078552e-05, 7.61076807975769e-05, 8.218362927436829e-05, 8.825957775115967e-05, 9.433552622795105e-05, 0.00010041147470474243, 0.00010648742318153381, 0.0001125633716583252, 0.00011863932013511658, 0.00012471526861190796, 0.00013079121708869934, 0.00013686716556549072, 0.0001429431140422821, 0.00014901906251907349, 0.00015509501099586487, 0.00016117095947265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 2.0, 2.0, 2.0, 6.0, 3.0, 10.0, 12.0, 20.0, 19.0, 35.0, 50.0, 85.0, 123.0, 175.0, 267.0, 441.0, 735.0, 1396.0, 2916.0, 6653.0, 17862.0, 54800.0, 232572.0, 608464.0, 80922.0, 24487.0, 8794.0, 3648.0, 1744.0, 869.0, 526.0, 322.0, 202.0, 117.0, 83.0, 56.0, 32.0, 25.0, 27.0, 13.0, 18.0, 7.0, 8.0, 6.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.445068359375, -0.4286766052246094, -0.41228485107421875, -0.3958930969238281, -0.3795013427734375, -0.3631095886230469, -0.34671783447265625, -0.3303260803222656, -0.313934326171875, -0.2975425720214844, -0.28115081787109375, -0.2647590637207031, -0.2483673095703125, -0.23197555541992188, -0.21558380126953125, -0.19919204711914062, -0.18280029296875, -0.16640853881835938, -0.15001678466796875, -0.13362503051757812, -0.1172332763671875, -0.10084152221679688, -0.08444976806640625, -0.06805801391601562, -0.051666259765625, -0.035274505615234375, -0.01888275146484375, -0.002490997314453125, 0.0139007568359375, 0.030292510986328125, 0.04668426513671875, 0.06307601928710938, 0.0794677734375, 0.09585952758789062, 0.11225128173828125, 0.12864303588867188, 0.1450347900390625, 0.16142654418945312, 0.17781829833984375, 0.19421005249023438, 0.210601806640625, 0.22699356079101562, 0.24338531494140625, 0.2597770690917969, 0.2761688232421875, 0.2925605773925781, 0.30895233154296875, 0.3253440856933594, 0.34173583984375, 0.3581275939941406, 0.37451934814453125, 0.3909111022949219, 0.4073028564453125, 0.4236946105957031, 0.44008636474609375, 0.4564781188964844, 0.472869873046875, 0.4892616271972656, 0.5056533813476562, 0.5220451354980469, 0.5384368896484375, 0.5548286437988281, 0.5712203979492188, 0.5876121520996094, 0.60400390625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 8.0, 5.0, 8.0, 5.0, 13.0, 15.0, 20.0, 25.0, 24.0, 43.0, 52.0, 71.0, 101.0, 125.0, 118.0, 90.0, 75.0, 52.0, 32.0, 27.0, 24.0, 18.0, 15.0, 9.0, 9.0, 4.0, 3.0, 6.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6376953125, -0.6177215576171875, -0.597747802734375, -0.5777740478515625, -0.55780029296875, -0.5378265380859375, -0.517852783203125, -0.4978790283203125, -0.4779052734375, -0.4579315185546875, -0.437957763671875, -0.4179840087890625, -0.39801025390625, -0.3780364990234375, -0.358062744140625, -0.3380889892578125, -0.318115234375, -0.2981414794921875, -0.278167724609375, -0.2581939697265625, -0.23822021484375, -0.2182464599609375, -0.198272705078125, -0.1782989501953125, -0.1583251953125, -0.1383514404296875, -0.118377685546875, -0.0984039306640625, -0.07843017578125, -0.0584564208984375, -0.038482666015625, -0.0185089111328125, 0.00146484375, 0.0214385986328125, 0.041412353515625, 0.0613861083984375, 0.08135986328125, 0.1013336181640625, 0.121307373046875, 0.1412811279296875, 0.1612548828125, 0.1812286376953125, 0.201202392578125, 0.2211761474609375, 0.24114990234375, 0.2611236572265625, 0.281097412109375, 0.3010711669921875, 0.321044921875, 0.3410186767578125, 0.360992431640625, 0.3809661865234375, 0.40093994140625, 0.4209136962890625, 0.440887451171875, 0.4608612060546875, 0.4808349609375, 0.5008087158203125, 0.520782470703125, 0.5407562255859375, 0.56072998046875, 0.5807037353515625, 0.600677490234375, 0.6206512451171875, 0.640625]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 6.0, 4.0, 10.0, 24.0, 80.0, 205.0, 425.0, 135.0, 61.0, 29.0, 10.0, 9.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-26.249160766601562, -25.562265396118164, -24.8753719329834, -24.1884765625, -23.5015811920166, -22.814685821533203, -22.127792358398438, -21.44089698791504, -20.75400161743164, -20.067106246948242, -19.380212783813477, -18.693317413330078, -18.00642204284668, -17.31952667236328, -16.632633209228516, -15.945737838745117, -15.258843421936035, -14.571949005126953, -13.885053634643555, -13.198159217834473, -12.511263847351074, -11.824369430541992, -11.137474060058594, -10.450579643249512, -9.76368522644043, -9.076790809631348, -8.38989543914795, -7.703001022338867, -7.016105651855469, -6.329211235046387, -5.6423163414001465, -4.955421447753906, -4.268526077270508, -3.5816311836242676, -2.8947362899780273, -2.207841634750366, -1.520946741104126, -0.8340518474578857, -0.1471571922302246, 0.5397377014160156, 1.2266325950622559, 1.913527488708496, 2.6004223823547363, 3.2873170375823975, 3.9742119312286377, 4.661107063293457, 5.348001480102539, 6.034896373748779, 6.7217912673950195, 7.40868616104126, 8.0955810546875, 8.782475471496582, 9.46937084197998, 10.156265258789062, 10.843160629272461, 11.530055046081543, 12.216949462890625, 12.903843879699707, 13.590739250183105, 14.277633666992188, 14.964529037475586, 15.651423454284668, 16.33831787109375, 17.02521324157715, 17.712108612060547]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 7.0, 13.0, 15.0, 26.0, 18.0, 23.0, 30.0, 31.0, 40.0, 35.0, 44.0, 62.0, 87.0, 103.0, 84.0, 62.0, 43.0, 37.0, 29.0, 37.0, 22.0, 16.0, 16.0, 18.0, 14.0, 23.0, 10.0, 10.0, 5.0, 8.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.228416442871094, -8.936429023742676, -8.644441604614258, -8.352453231811523, -8.060465812683105, -7.7684783935546875, -7.476490497589111, -7.184502601623535, -6.892515182495117, -6.600527763366699, -6.308539867401123, -6.016551971435547, -5.724564552307129, -5.432577133178711, -5.140589237213135, -4.848601341247559, -4.556613922119141, -4.264626502990723, -3.9726386070251465, -3.6806509494781494, -3.3886632919311523, -3.0966756343841553, -2.804687976837158, -2.512700319290161, -2.220712661743164, -1.928725004196167, -1.63673734664917, -1.3447496891021729, -1.0527620315551758, -0.7607743740081787, -0.46878671646118164, -0.17679905891418457, 0.1151876449584961, 0.40717530250549316, 0.6991629600524902, 0.9911506175994873, 1.2831382751464844, 1.5751259326934814, 1.8671135902404785, 2.1591012477874756, 2.4510889053344727, 2.7430765628814697, 3.035064220428467, 3.327051877975464, 3.619039535522461, 3.911027193069458, 4.203014850616455, 4.495002746582031, 4.786990165710449, 5.078977584838867, 5.370965480804443, 5.6629533767700195, 5.9549407958984375, 6.2469282150268555, 6.538916110992432, 6.830904006958008, 7.122891426086426, 7.414878845214844, 7.70686674118042, 7.998854637145996, 8.290842056274414, 8.582829475402832, 8.87481689453125, 9.166805267333984, 9.458792686462402]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 7.0, 2.0, 15.0, 17.0, 25.0, 36.0, 45.0, 55.0, 94.0, 133.0, 180.0, 386.0, 679.0, 1270.0, 3037.0, 8698.0, 31964.0, 180696.0, 1406770.0, 2151722.0, 340181.0, 49548.0, 11184.0, 3794.0, 1616.0, 841.0, 462.0, 258.0, 187.0, 104.0, 80.0, 68.0, 37.0, 21.0, 29.0, 18.0, 7.0, 6.0, 5.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8447265625, -0.819244384765625, -0.79376220703125, -0.768280029296875, -0.7427978515625, -0.717315673828125, -0.69183349609375, -0.666351318359375, -0.640869140625, -0.615386962890625, -0.58990478515625, -0.564422607421875, -0.5389404296875, -0.513458251953125, -0.48797607421875, -0.462493896484375, -0.43701171875, -0.411529541015625, -0.38604736328125, -0.360565185546875, -0.3350830078125, -0.309600830078125, -0.28411865234375, -0.258636474609375, -0.233154296875, -0.207672119140625, -0.18218994140625, -0.156707763671875, -0.1312255859375, -0.105743408203125, -0.08026123046875, -0.054779052734375, -0.029296875, -0.003814697265625, 0.02166748046875, 0.047149658203125, 0.0726318359375, 0.098114013671875, 0.12359619140625, 0.149078369140625, 0.174560546875, 0.200042724609375, 0.22552490234375, 0.251007080078125, 0.2764892578125, 0.301971435546875, 0.32745361328125, 0.352935791015625, 0.37841796875, 0.403900146484375, 0.42938232421875, 0.454864501953125, 0.4803466796875, 0.505828857421875, 0.53131103515625, 0.556793212890625, 0.582275390625, 0.607757568359375, 0.63323974609375, 0.658721923828125, 0.6842041015625, 0.709686279296875, 0.73516845703125, 0.760650634765625, 0.7861328125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 5.0, 2.0, 5.0, 5.0, 8.0, 11.0, 17.0, 31.0, 35.0, 49.0, 50.0, 57.0, 54.0, 64.0, 78.0, 80.0, 81.0, 75.0, 63.0, 64.0, 52.0, 29.0, 26.0, 20.0, 15.0, 14.0, 4.0, 7.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9091796875, -0.8780975341796875, -0.847015380859375, -0.8159332275390625, -0.78485107421875, -0.7537689208984375, -0.722686767578125, -0.6916046142578125, -0.6605224609375, -0.6294403076171875, -0.598358154296875, -0.5672760009765625, -0.53619384765625, -0.5051116943359375, -0.474029541015625, -0.4429473876953125, -0.411865234375, -0.3807830810546875, -0.349700927734375, -0.3186187744140625, -0.28753662109375, -0.2564544677734375, -0.225372314453125, -0.1942901611328125, -0.1632080078125, -0.1321258544921875, -0.101043701171875, -0.0699615478515625, -0.03887939453125, -0.0077972412109375, 0.023284912109375, 0.0543670654296875, 0.08544921875, 0.1165313720703125, 0.147613525390625, 0.1786956787109375, 0.20977783203125, 0.2408599853515625, 0.271942138671875, 0.3030242919921875, 0.3341064453125, 0.3651885986328125, 0.396270751953125, 0.4273529052734375, 0.45843505859375, 0.4895172119140625, 0.520599365234375, 0.5516815185546875, 0.582763671875, 0.6138458251953125, 0.644927978515625, 0.6760101318359375, 0.70709228515625, 0.7381744384765625, 0.769256591796875, 0.8003387451171875, 0.8314208984375, 0.8625030517578125, 0.893585205078125, 0.9246673583984375, 0.95574951171875, 0.9868316650390625, 1.017913818359375, 1.0489959716796875, 1.080078125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 12.0, 13.0, 19.0, 38.0, 88.0, 144.0, 298.0, 513.0, 1463.0, 11631.0, 3111727.0, 1058608.0, 7236.0, 1241.0, 521.0, 328.0, 185.0, 105.0, 42.0, 30.0, 17.0, 9.0, 15.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-4.76171875, -4.6533203125, -4.544921875, -4.4365234375, -4.328125, -4.2197265625, -4.111328125, -4.0029296875, -3.89453125, -3.7861328125, -3.677734375, -3.5693359375, -3.4609375, -3.3525390625, -3.244140625, -3.1357421875, -3.02734375, -2.9189453125, -2.810546875, -2.7021484375, -2.59375, -2.4853515625, -2.376953125, -2.2685546875, -2.16015625, -2.0517578125, -1.943359375, -1.8349609375, -1.7265625, -1.6181640625, -1.509765625, -1.4013671875, -1.29296875, -1.1845703125, -1.076171875, -0.9677734375, -0.859375, -0.7509765625, -0.642578125, -0.5341796875, -0.42578125, -0.3173828125, -0.208984375, -0.1005859375, 0.0078125, 0.1162109375, 0.224609375, 0.3330078125, 0.44140625, 0.5498046875, 0.658203125, 0.7666015625, 0.875, 0.9833984375, 1.091796875, 1.2001953125, 1.30859375, 1.4169921875, 1.525390625, 1.6337890625, 1.7421875, 1.8505859375, 1.958984375, 2.0673828125, 2.17578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 5.0, 8.0, 9.0, 16.0, 26.0, 50.0, 83.0, 196.0, 554.0, 1179.0, 1075.0, 518.0, 204.0, 78.0, 42.0, 25.0, 9.0, 6.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89404296875, -0.8196792602539062, -0.7453155517578125, -0.6709518432617188, -0.596588134765625, -0.5222244262695312, -0.4478607177734375, -0.37349700927734375, -0.29913330078125, -0.22476959228515625, -0.1504058837890625, -0.07604217529296875, -0.001678466796875, 0.07268524169921875, 0.1470489501953125, 0.22141265869140625, 0.2957763671875, 0.37014007568359375, 0.4445037841796875, 0.5188674926757812, 0.593231201171875, 0.6675949096679688, 0.7419586181640625, 0.8163223266601562, 0.89068603515625, 0.9650497436523438, 1.0394134521484375, 1.1137771606445312, 1.188140869140625, 1.2625045776367188, 1.3368682861328125, 1.4112319946289062, 1.485595703125, 1.5599594116210938, 1.6343231201171875, 1.7086868286132812, 1.783050537109375, 1.8574142456054688, 1.9317779541015625, 2.0061416625976562, 2.08050537109375, 2.1548690795898438, 2.2292327880859375, 2.3035964965820312, 2.377960205078125, 2.4523239135742188, 2.5266876220703125, 2.6010513305664062, 2.6754150390625, 2.7497787475585938, 2.8241424560546875, 2.8985061645507812, 2.972869873046875, 3.0472335815429688, 3.1215972900390625, 3.1959609985351562, 3.27032470703125, 3.3446884155273438, 3.4190521240234375, 3.4934158325195312, 3.567779541015625, 3.6421432495117188, 3.7165069580078125, 3.7908706665039062, 3.865234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 9.0, 19.0, 48.0, 96.0, 162.0, 223.0, 182.0, 132.0, 60.0, 23.0, 10.0, 12.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.602823257446289, -9.08700942993164, -8.571195602416992, -8.055381774902344, -7.539567470550537, -7.023753643035889, -6.507939338684082, -5.992125511169434, -5.476311683654785, -4.960497856140137, -4.444684028625488, -3.9288697242736816, -3.413055896759033, -2.8972420692443848, -2.3814280033111572, -1.8656139373779297, -1.3498001098632812, -0.8339861631393433, -0.3181722164154053, 0.19764173030853271, 0.7134556770324707, 1.2292695045471191, 1.7450835704803467, 2.260897636413574, 2.7767114639282227, 3.292525291442871, 3.8083393573760986, 4.324153423309326, 4.839967250823975, 5.355781078338623, 5.87159538269043, 6.387409210205078, 6.903224945068359, 7.419038772583008, 7.934852600097656, 8.450666427612305, 8.966480255126953, 9.482294082641602, 9.998108863830566, 10.513922691345215, 11.029736518859863, 11.545550346374512, 12.06136417388916, 12.577178001403809, 13.092992782592773, 13.608806610107422, 14.12462043762207, 14.640434265136719, 15.156248092651367, 15.672061920166016, 16.187875747680664, 16.703689575195312, 17.21950340270996, 17.73531723022461, 18.251131057739258, 18.766944885253906, 19.282760620117188, 19.798574447631836, 20.314388275146484, 20.830202102661133, 21.34601593017578, 21.86182975769043, 22.377643585205078, 22.89345932006836, 23.409271240234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 3.0, 6.0, 6.0, 11.0, 8.0, 10.0, 12.0, 11.0, 14.0, 19.0, 38.0, 39.0, 34.0, 42.0, 50.0, 51.0, 62.0, 66.0, 57.0, 59.0, 55.0, 54.0, 46.0, 40.0, 42.0, 25.0, 25.0, 22.0, 22.0, 17.0, 9.0, 7.0, 4.0, 9.0, 2.0, 6.0, 4.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-9.808042526245117, -9.544102668762207, -9.280162811279297, -9.016222953796387, -8.752283096313477, -8.48834228515625, -8.224403381347656, -7.960463047027588, -7.6965227127075195, -7.432582855224609, -7.168642997741699, -6.904703140258789, -6.640762805938721, -6.3768229484558105, -6.1128830909729, -5.84894323348999, -5.58500337600708, -5.32106351852417, -5.05712366104126, -4.793183326721191, -4.529243469238281, -4.265303611755371, -4.001363754272461, -3.737423896789551, -3.4734838008880615, -3.2095439434051514, -2.945603847503662, -2.681663990020752, -2.417724132537842, -2.1537840366363525, -1.8898441791534424, -1.6259042024612427, -1.3619637489318848, -1.098023772239685, -0.8340838551521301, -0.5701439380645752, -0.3062039613723755, -0.04226398468017578, 0.22167587280273438, 0.4856158494949341, 0.7495558261871338, 1.0134958028793335, 1.2774357795715332, 1.5413756370544434, 1.805315613746643, 2.0692555904388428, 2.333195447921753, 2.597135543823242, 2.8610754013061523, 3.1250152587890625, 3.3889553546905518, 3.652895212173462, 3.916835308074951, 4.180775165557861, 4.4447150230407715, 4.708654880523682, 4.97259521484375, 5.23653507232666, 5.50047492980957, 5.7644147872924805, 6.028355121612549, 6.292294979095459, 6.556234836578369, 6.820174694061279, 7.0841145515441895]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 4.0, 3.0, 5.0, 9.0, 11.0, 17.0, 22.0, 35.0, 45.0, 88.0, 125.0, 217.0, 350.0, 711.0, 1430.0, 3066.0, 7720.0, 21794.0, 76294.0, 339881.0, 444782.0, 106501.0, 28805.0, 9472.0, 3728.0, 1611.0, 799.0, 409.0, 238.0, 117.0, 90.0, 63.0, 31.0, 24.0, 19.0, 13.0, 6.0, 9.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.9599609375, -0.9280853271484375, -0.896209716796875, -0.8643341064453125, -0.83245849609375, -0.8005828857421875, -0.768707275390625, -0.7368316650390625, -0.7049560546875, -0.6730804443359375, -0.641204833984375, -0.6093292236328125, -0.57745361328125, -0.5455780029296875, -0.513702392578125, -0.4818267822265625, -0.449951171875, -0.4180755615234375, -0.386199951171875, -0.3543243408203125, -0.32244873046875, -0.2905731201171875, -0.258697509765625, -0.2268218994140625, -0.1949462890625, -0.1630706787109375, -0.131195068359375, -0.0993194580078125, -0.06744384765625, -0.0355682373046875, -0.003692626953125, 0.0281829833984375, 0.06005859375, 0.0919342041015625, 0.123809814453125, 0.1556854248046875, 0.18756103515625, 0.2194366455078125, 0.251312255859375, 0.2831878662109375, 0.3150634765625, 0.3469390869140625, 0.378814697265625, 0.4106903076171875, 0.44256591796875, 0.4744415283203125, 0.506317138671875, 0.5381927490234375, 0.570068359375, 0.6019439697265625, 0.633819580078125, 0.6656951904296875, 0.69757080078125, 0.7294464111328125, 0.761322021484375, 0.7931976318359375, 0.8250732421875, 0.8569488525390625, 0.888824462890625, 0.9207000732421875, 0.95257568359375, 0.9844512939453125, 1.016326904296875, 1.0482025146484375, 1.080078125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 3.0, 8.0, 6.0, 7.0, 13.0, 16.0, 23.0, 27.0, 35.0, 37.0, 41.0, 51.0, 53.0, 72.0, 49.0, 77.0, 60.0, 82.0, 61.0, 75.0, 41.0, 47.0, 34.0, 27.0, 17.0, 10.0, 10.0, 7.0, 4.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85888671875, -0.8277206420898438, -0.7965545654296875, -0.7653884887695312, -0.734222412109375, -0.7030563354492188, -0.6718902587890625, -0.6407241821289062, -0.60955810546875, -0.5783920288085938, -0.5472259521484375, -0.5160598754882812, -0.484893798828125, -0.45372772216796875, -0.4225616455078125, -0.39139556884765625, -0.3602294921875, -0.32906341552734375, -0.2978973388671875, -0.26673126220703125, -0.235565185546875, -0.20439910888671875, -0.1732330322265625, -0.14206695556640625, -0.11090087890625, -0.07973480224609375, -0.0485687255859375, -0.01740264892578125, 0.013763427734375, 0.04492950439453125, 0.0760955810546875, 0.10726165771484375, 0.138427734375, 0.16959381103515625, 0.2007598876953125, 0.23192596435546875, 0.263092041015625, 0.29425811767578125, 0.3254241943359375, 0.35659027099609375, 0.38775634765625, 0.41892242431640625, 0.4500885009765625, 0.48125457763671875, 0.512420654296875, 0.5435867309570312, 0.5747528076171875, 0.6059188842773438, 0.6370849609375, 0.6682510375976562, 0.6994171142578125, 0.7305831909179688, 0.761749267578125, 0.7929153442382812, 0.8240814208984375, 0.8552474975585938, 0.88641357421875, 0.9175796508789062, 0.9487457275390625, 0.9799118041992188, 1.011077880859375, 1.0422439575195312, 1.0734100341796875, 1.1045761108398438, 1.1357421875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 6.0, 3.0, 8.0, 8.0, 11.0, 13.0, 12.0, 26.0, 24.0, 25.0, 45.0, 55.0, 96.0, 111.0, 136.0, 226.0, 350.0, 483.0, 900.0, 1853.0, 4938.0, 19399.0, 138512.0, 775646.0, 84433.0, 13659.0, 3724.0, 1544.0, 768.0, 457.0, 281.0, 219.0, 152.0, 109.0, 78.0, 66.0, 50.0, 36.0, 35.0, 19.0, 15.0, 7.0, 5.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.5322265625, -1.4834136962890625, -1.434600830078125, -1.3857879638671875, -1.33697509765625, -1.2881622314453125, -1.239349365234375, -1.1905364990234375, -1.1417236328125, -1.0929107666015625, -1.044097900390625, -0.9952850341796875, -0.94647216796875, -0.8976593017578125, -0.848846435546875, -0.8000335693359375, -0.751220703125, -0.7024078369140625, -0.653594970703125, -0.6047821044921875, -0.55596923828125, -0.5071563720703125, -0.458343505859375, -0.4095306396484375, -0.3607177734375, -0.3119049072265625, -0.263092041015625, -0.2142791748046875, -0.16546630859375, -0.1166534423828125, -0.067840576171875, -0.0190277099609375, 0.02978515625, 0.0785980224609375, 0.127410888671875, 0.1762237548828125, 0.22503662109375, 0.2738494873046875, 0.322662353515625, 0.3714752197265625, 0.4202880859375, 0.4691009521484375, 0.517913818359375, 0.5667266845703125, 0.61553955078125, 0.6643524169921875, 0.713165283203125, 0.7619781494140625, 0.810791015625, 0.8596038818359375, 0.908416748046875, 0.9572296142578125, 1.00604248046875, 1.0548553466796875, 1.103668212890625, 1.1524810791015625, 1.2012939453125, 1.2501068115234375, 1.298919677734375, 1.3477325439453125, 1.39654541015625, 1.4453582763671875, 1.494171142578125, 1.5429840087890625, 1.591796875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 6.0, 8.0, 7.0, 15.0, 10.0, 15.0, 16.0, 28.0, 21.0, 27.0, 26.0, 52.0, 53.0, 48.0, 52.0, 50.0, 45.0, 58.0, 66.0, 52.0, 57.0, 46.0, 49.0, 27.0, 31.0, 21.0, 21.0, 23.0, 8.0, 13.0, 9.0, 11.0, 7.0, 7.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.408203125, -3.306488037109375, -3.20477294921875, -3.103057861328125, -3.0013427734375, -2.899627685546875, -2.79791259765625, -2.696197509765625, -2.594482421875, -2.492767333984375, -2.39105224609375, -2.289337158203125, -2.1876220703125, -2.085906982421875, -1.98419189453125, -1.882476806640625, -1.78076171875, -1.679046630859375, -1.57733154296875, -1.475616455078125, -1.3739013671875, -1.272186279296875, -1.17047119140625, -1.068756103515625, -0.967041015625, -0.865325927734375, -0.76361083984375, -0.661895751953125, -0.5601806640625, -0.458465576171875, -0.35675048828125, -0.255035400390625, -0.1533203125, -0.051605224609375, 0.05010986328125, 0.151824951171875, 0.2535400390625, 0.355255126953125, 0.45697021484375, 0.558685302734375, 0.660400390625, 0.762115478515625, 0.86383056640625, 0.965545654296875, 1.0672607421875, 1.168975830078125, 1.27069091796875, 1.372406005859375, 1.47412109375, 1.575836181640625, 1.67755126953125, 1.779266357421875, 1.8809814453125, 1.982696533203125, 2.08441162109375, 2.186126708984375, 2.287841796875, 2.389556884765625, 2.49127197265625, 2.592987060546875, 2.6947021484375, 2.796417236328125, 2.89813232421875, 2.999847412109375, 3.1015625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 4.0, 3.0, 5.0, 7.0, 6.0, 12.0, 17.0, 22.0, 35.0, 52.0, 61.0, 108.0, 155.0, 246.0, 462.0, 947.0, 2224.0, 5999.0, 23865.0, 178156.0, 767698.0, 51692.0, 10622.0, 3297.0, 1331.0, 660.0, 338.0, 173.0, 96.0, 68.0, 54.0, 35.0, 29.0, 24.0, 10.0, 8.0, 9.0, 2.0, 7.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.69677734375, -0.6769943237304688, -0.6572113037109375, -0.6374282836914062, -0.617645263671875, -0.5978622436523438, -0.5780792236328125, -0.5582962036132812, -0.53851318359375, -0.5187301635742188, -0.4989471435546875, -0.47916412353515625, -0.459381103515625, -0.43959808349609375, -0.4198150634765625, -0.40003204345703125, -0.3802490234375, -0.36046600341796875, -0.3406829833984375, -0.32089996337890625, -0.301116943359375, -0.28133392333984375, -0.2615509033203125, -0.24176788330078125, -0.22198486328125, -0.20220184326171875, -0.1824188232421875, -0.16263580322265625, -0.142852783203125, -0.12306976318359375, -0.1032867431640625, -0.08350372314453125, -0.063720703125, -0.04393768310546875, -0.0241546630859375, -0.00437164306640625, 0.015411376953125, 0.03519439697265625, 0.0549774169921875, 0.07476043701171875, 0.09454345703125, 0.11432647705078125, 0.1341094970703125, 0.15389251708984375, 0.173675537109375, 0.19345855712890625, 0.2132415771484375, 0.23302459716796875, 0.2528076171875, 0.27259063720703125, 0.2923736572265625, 0.31215667724609375, 0.331939697265625, 0.35172271728515625, 0.3715057373046875, 0.39128875732421875, 0.41107177734375, 0.43085479736328125, 0.4506378173828125, 0.47042083740234375, 0.490203857421875, 0.5099868774414062, 0.5297698974609375, 0.5495529174804688, 0.5693359375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 4.0, 9.0, 6.0, 23.0, 44.0, 87.0, 148.0, 228.0, 206.0, 104.0, 63.0, 31.0, 16.0, 8.0, 9.0, 1.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0002803802490234375, -0.0002718120813369751, -0.0002632439136505127, -0.0002546757459640503, -0.0002461075782775879, -0.0002375394105911255, -0.00022897124290466309, -0.00022040307521820068, -0.00021183490753173828, -0.00020326673984527588, -0.00019469857215881348, -0.00018613040447235107, -0.00017756223678588867, -0.00016899406909942627, -0.00016042590141296387, -0.00015185773372650146, -0.00014328956604003906, -0.00013472139835357666, -0.00012615323066711426, -0.00011758506298065186, -0.00010901689529418945, -0.00010044872760772705, -9.188055992126465e-05, -8.331239223480225e-05, -7.474422454833984e-05, -6.617605686187744e-05, -5.760788917541504e-05, -4.903972148895264e-05, -4.0471553802490234e-05, -3.190338611602783e-05, -2.333521842956543e-05, -1.4767050743103027e-05, -6.198883056640625e-06, 2.3692846298217773e-06, 1.093745231628418e-05, 1.9505620002746582e-05, 2.8073787689208984e-05, 3.664195537567139e-05, 4.521012306213379e-05, 5.377829074859619e-05, 6.23464584350586e-05, 7.0914626121521e-05, 7.94827938079834e-05, 8.80509614944458e-05, 9.66191291809082e-05, 0.0001051872968673706, 0.00011375546455383301, 0.0001223236322402954, 0.0001308917999267578, 0.00013945996761322021, 0.00014802813529968262, 0.00015659630298614502, 0.00016516447067260742, 0.00017373263835906982, 0.00018230080604553223, 0.00019086897373199463, 0.00019943714141845703, 0.00020800530910491943, 0.00021657347679138184, 0.00022514164447784424, 0.00023370981216430664, 0.00024227797985076904, 0.00025084614753723145, 0.00025941431522369385, 0.00026798248291015625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 10.0, 12.0, 8.0, 17.0, 18.0, 28.0, 32.0, 55.0, 57.0, 97.0, 140.0, 248.0, 357.0, 718.0, 1353.0, 2725.0, 6610.0, 19690.0, 91863.0, 750721.0, 133527.0, 25694.0, 7957.0, 3145.0, 1500.0, 707.0, 427.0, 258.0, 179.0, 115.0, 82.0, 40.0, 39.0, 35.0, 15.0, 26.0, 10.0, 9.0, 4.0, 5.0, 8.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5419921875, -0.5258598327636719, -0.5097274780273438, -0.4935951232910156, -0.4774627685546875, -0.4613304138183594, -0.44519805908203125, -0.4290657043457031, -0.412933349609375, -0.3968009948730469, -0.38066864013671875, -0.3645362854003906, -0.3484039306640625, -0.3322715759277344, -0.31613922119140625, -0.3000068664550781, -0.28387451171875, -0.2677421569824219, -0.25160980224609375, -0.23547744750976562, -0.2193450927734375, -0.20321273803710938, -0.18708038330078125, -0.17094802856445312, -0.154815673828125, -0.13868331909179688, -0.12255096435546875, -0.10641860961914062, -0.0902862548828125, -0.07415390014648438, -0.05802154541015625, -0.041889190673828125, -0.0257568359375, -0.009624481201171875, 0.00650787353515625, 0.022640228271484375, 0.0387725830078125, 0.054904937744140625, 0.07103729248046875, 0.08716964721679688, 0.103302001953125, 0.11943435668945312, 0.13556671142578125, 0.15169906616210938, 0.1678314208984375, 0.18396377563476562, 0.20009613037109375, 0.21622848510742188, 0.23236083984375, 0.24849319458007812, 0.26462554931640625, 0.2807579040527344, 0.2968902587890625, 0.3130226135253906, 0.32915496826171875, 0.3452873229980469, 0.361419677734375, 0.3775520324707031, 0.39368438720703125, 0.4098167419433594, 0.4259490966796875, 0.4420814514160156, 0.45821380615234375, 0.4743461608886719, 0.490478515625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 0.0, 3.0, 3.0, 8.0, 2.0, 4.0, 7.0, 10.0, 6.0, 19.0, 18.0, 22.0, 38.0, 57.0, 71.0, 89.0, 95.0, 129.0, 99.0, 71.0, 63.0, 46.0, 27.0, 21.0, 19.0, 23.0, 5.0, 6.0, 8.0, 4.0, 3.0, 6.0, 2.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.7275390625, -0.7084617614746094, -0.6893844604492188, -0.6703071594238281, -0.6512298583984375, -0.6321525573730469, -0.6130752563476562, -0.5939979553222656, -0.574920654296875, -0.5558433532714844, -0.5367660522460938, -0.5176887512207031, -0.4986114501953125, -0.4795341491699219, -0.46045684814453125, -0.4413795471191406, -0.42230224609375, -0.4032249450683594, -0.38414764404296875, -0.3650703430175781, -0.3459930419921875, -0.3269157409667969, -0.30783843994140625, -0.2887611389160156, -0.269683837890625, -0.2506065368652344, -0.23152923583984375, -0.21245193481445312, -0.1933746337890625, -0.17429733276367188, -0.15522003173828125, -0.13614273071289062, -0.1170654296875, -0.09798812866210938, -0.07891082763671875, -0.059833526611328125, -0.0407562255859375, -0.021678924560546875, -0.00260162353515625, 0.016475677490234375, 0.035552978515625, 0.054630279541015625, 0.07370758056640625, 0.09278488159179688, 0.1118621826171875, 0.13093948364257812, 0.15001678466796875, 0.16909408569335938, 0.18817138671875, 0.20724868774414062, 0.22632598876953125, 0.24540328979492188, 0.2644805908203125, 0.2835578918457031, 0.30263519287109375, 0.3217124938964844, 0.340789794921875, 0.3598670959472656, 0.37894439697265625, 0.3980216979980469, 0.4170989990234375, 0.4361763000488281, 0.45525360107421875, 0.4743309020996094, 0.493408203125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 24.0, 44.0, 118.0, 283.0, 407.0, 76.0, 26.0, 9.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.2901668548584, -18.490123748779297, -17.690080642700195, -16.890037536621094, -16.089994430541992, -15.28995132446289, -14.489907264709473, -13.689864158630371, -12.88982105255127, -12.089777946472168, -11.289734840393066, -10.489690780639648, -9.689647674560547, -8.889604568481445, -8.089561462402344, -7.289518356323242, -6.489475250244141, -5.689432144165039, -4.8893890380859375, -4.089345455169678, -3.289302349090576, -2.4892592430114746, -1.6892156600952148, -0.8891725540161133, -0.08912944793701172, 0.7109137773513794, 1.5109570026397705, 2.311000347137451, 3.1110434532165527, 3.9110865592956543, 4.711130142211914, 5.511173248291016, 6.31121826171875, 7.111261367797852, 7.911304473876953, 8.711347579956055, 9.511390686035156, 10.311433792114258, 11.111477851867676, 11.911520957946777, 12.711564064025879, 13.51160717010498, 14.311650276184082, 15.1116943359375, 15.911737442016602, 16.711780548095703, 17.511823654174805, 18.311866760253906, 19.111909866333008, 19.91195297241211, 20.71199607849121, 21.512039184570312, 22.312082290649414, 23.112125396728516, 23.91217041015625, 24.71221160888672, 25.512256622314453, 26.312299728393555, 27.112342834472656, 27.912385940551758, 28.71242904663086, 29.51247215270996, 30.312515258789062, 31.112560272216797, 31.912601470947266]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 6.0, 4.0, 5.0, 13.0, 3.0, 7.0, 10.0, 14.0, 12.0, 22.0, 12.0, 20.0, 28.0, 34.0, 27.0, 29.0, 35.0, 40.0, 73.0, 130.0, 116.0, 54.0, 40.0, 31.0, 27.0, 20.0, 25.0, 20.0, 15.0, 16.0, 14.0, 14.0, 15.0, 14.0, 12.0, 12.0, 4.0, 2.0, 5.0, 7.0, 5.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.189980506896973, -13.757020950317383, -13.324061393737793, -12.891101837158203, -12.458141326904297, -12.025181770324707, -11.592222213745117, -11.159262657165527, -10.726303100585938, -10.293343544006348, -9.860383987426758, -9.427423477172852, -8.994463920593262, -8.561504364013672, -8.128544807434082, -7.695585250854492, -7.262625217437744, -6.829665660858154, -6.396705627441406, -5.963746070861816, -5.530786514282227, -5.097826957702637, -4.664866924285889, -4.231907367706299, -3.79894757270813, -3.365987777709961, -2.933028221130371, -2.500068426132202, -2.067108631134033, -1.6341490745544434, -1.2011892795562744, -0.7682297229766846, -0.3352699279785156, 0.09768977761268616, 0.5306494832038879, 0.9636092185974121, 1.3965688943862915, 1.829528570175171, 2.26248836517334, 2.6954479217529297, 3.1284077167510986, 3.5613675117492676, 3.9943270683288574, 4.4272871017456055, 4.860246658325195, 5.293206214904785, 5.726165771484375, 6.159125328063965, 6.592085361480713, 7.025044918060303, 7.458004951477051, 7.890964508056641, 8.32392406463623, 8.75688362121582, 9.189844131469727, 9.622802734375, 10.055763244628906, 10.488722801208496, 10.921682357788086, 11.354642868041992, 11.787602424621582, 12.220561981201172, 12.653521537780762, 13.086481094360352, 13.519440650939941]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 4.0, 12.0, 27.0, 32.0, 42.0, 71.0, 93.0, 165.0, 251.0, 426.0, 724.0, 1185.0, 2187.0, 4302.0, 9410.0, 23972.0, 72996.0, 282882.0, 1050155.0, 1733856.0, 749005.0, 184815.0, 47821.0, 15511.0, 6538.0, 3331.0, 1650.0, 1050.0, 622.0, 358.0, 234.0, 177.0, 98.0, 61.0, 43.0, 36.0, 30.0, 34.0, 17.0, 14.0, 10.0, 9.0, 8.0, 4.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.83447265625, -0.806976318359375, -0.77947998046875, -0.751983642578125, -0.7244873046875, -0.696990966796875, -0.66949462890625, -0.641998291015625, -0.614501953125, -0.587005615234375, -0.55950927734375, -0.532012939453125, -0.5045166015625, -0.477020263671875, -0.44952392578125, -0.422027587890625, -0.39453125, -0.367034912109375, -0.33953857421875, -0.312042236328125, -0.2845458984375, -0.257049560546875, -0.22955322265625, -0.202056884765625, -0.174560546875, -0.147064208984375, -0.11956787109375, -0.092071533203125, -0.0645751953125, -0.037078857421875, -0.00958251953125, 0.017913818359375, 0.04541015625, 0.072906494140625, 0.10040283203125, 0.127899169921875, 0.1553955078125, 0.182891845703125, 0.21038818359375, 0.237884521484375, 0.265380859375, 0.292877197265625, 0.32037353515625, 0.347869873046875, 0.3753662109375, 0.402862548828125, 0.43035888671875, 0.457855224609375, 0.4853515625, 0.512847900390625, 0.54034423828125, 0.567840576171875, 0.5953369140625, 0.622833251953125, 0.65032958984375, 0.677825927734375, 0.705322265625, 0.732818603515625, 0.76031494140625, 0.787811279296875, 0.8153076171875, 0.842803955078125, 0.87030029296875, 0.897796630859375, 0.92529296875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 8.0, 9.0, 5.0, 14.0, 14.0, 24.0, 28.0, 28.0, 40.0, 46.0, 58.0, 68.0, 57.0, 64.0, 62.0, 65.0, 59.0, 72.0, 61.0, 46.0, 38.0, 38.0, 22.0, 17.0, 12.0, 11.0, 10.0, 4.0, 7.0, 2.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81591796875, -0.7862014770507812, -0.7564849853515625, -0.7267684936523438, -0.697052001953125, -0.6673355102539062, -0.6376190185546875, -0.6079025268554688, -0.57818603515625, -0.5484695434570312, -0.5187530517578125, -0.48903656005859375, -0.459320068359375, -0.42960357666015625, -0.3998870849609375, -0.37017059326171875, -0.3404541015625, -0.31073760986328125, -0.2810211181640625, -0.25130462646484375, -0.221588134765625, -0.19187164306640625, -0.1621551513671875, -0.13243865966796875, -0.10272216796875, -0.07300567626953125, -0.0432891845703125, -0.01357269287109375, 0.016143798828125, 0.04586029052734375, 0.0755767822265625, 0.10529327392578125, 0.135009765625, 0.16472625732421875, 0.1944427490234375, 0.22415924072265625, 0.253875732421875, 0.28359222412109375, 0.3133087158203125, 0.34302520751953125, 0.37274169921875, 0.40245819091796875, 0.4321746826171875, 0.46189117431640625, 0.491607666015625, 0.5213241577148438, 0.5510406494140625, 0.5807571411132812, 0.6104736328125, 0.6401901245117188, 0.6699066162109375, 0.6996231079101562, 0.729339599609375, 0.7590560913085938, 0.7887725830078125, 0.8184890747070312, 0.84820556640625, 0.8779220581054688, 0.9076385498046875, 0.9373550415039062, 0.967071533203125, 0.9967880249023438, 1.0265045166015625, 1.0562210083007812, 1.0859375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 11.0, 16.0, 18.0, 23.0, 34.0, 59.0, 113.0, 268.0, 569.0, 1549.0, 7649.0, 1333018.0, 2839219.0, 8755.0, 1739.0, 611.0, 272.0, 133.0, 87.0, 51.0, 20.0, 23.0, 14.0, 14.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.203125, -5.99658203125, -5.7900390625, -5.58349609375, -5.376953125, -5.17041015625, -4.9638671875, -4.75732421875, -4.55078125, -4.34423828125, -4.1376953125, -3.93115234375, -3.724609375, -3.51806640625, -3.3115234375, -3.10498046875, -2.8984375, -2.69189453125, -2.4853515625, -2.27880859375, -2.072265625, -1.86572265625, -1.6591796875, -1.45263671875, -1.24609375, -1.03955078125, -0.8330078125, -0.62646484375, -0.419921875, -0.21337890625, -0.0068359375, 0.19970703125, 0.40625, 0.61279296875, 0.8193359375, 1.02587890625, 1.232421875, 1.43896484375, 1.6455078125, 1.85205078125, 2.05859375, 2.26513671875, 2.4716796875, 2.67822265625, 2.884765625, 3.09130859375, 3.2978515625, 3.50439453125, 3.7109375, 3.91748046875, 4.1240234375, 4.33056640625, 4.537109375, 4.74365234375, 4.9501953125, 5.15673828125, 5.36328125, 5.56982421875, 5.7763671875, 5.98291015625, 6.189453125, 6.39599609375, 6.6025390625, 6.80908203125, 7.015625]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 12.0, 13.0, 19.0, 23.0, 34.0, 59.0, 76.0, 120.0, 190.0, 364.0, 538.0, 743.0, 655.0, 468.0, 304.0, 141.0, 92.0, 66.0, 45.0, 21.0, 29.0, 19.0, 11.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.205078125, -3.112945556640625, -3.02081298828125, -2.928680419921875, -2.8365478515625, -2.744415283203125, -2.65228271484375, -2.560150146484375, -2.468017578125, -2.375885009765625, -2.28375244140625, -2.191619873046875, -2.0994873046875, -2.007354736328125, -1.91522216796875, -1.823089599609375, -1.73095703125, -1.638824462890625, -1.54669189453125, -1.454559326171875, -1.3624267578125, -1.270294189453125, -1.17816162109375, -1.086029052734375, -0.993896484375, -0.901763916015625, -0.80963134765625, -0.717498779296875, -0.6253662109375, -0.533233642578125, -0.44110107421875, -0.348968505859375, -0.2568359375, -0.164703369140625, -0.07257080078125, 0.019561767578125, 0.1116943359375, 0.203826904296875, 0.29595947265625, 0.388092041015625, 0.480224609375, 0.572357177734375, 0.66448974609375, 0.756622314453125, 0.8487548828125, 0.940887451171875, 1.03302001953125, 1.125152587890625, 1.21728515625, 1.309417724609375, 1.40155029296875, 1.493682861328125, 1.5858154296875, 1.677947998046875, 1.77008056640625, 1.862213134765625, 1.954345703125, 2.046478271484375, 2.13861083984375, 2.230743408203125, 2.3228759765625, 2.415008544921875, 2.50714111328125, 2.599273681640625, 2.69140625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 7.0, 5.0, 13.0, 24.0, 63.0, 116.0, 234.0, 230.0, 151.0, 63.0, 34.0, 12.0, 8.0, 10.0, 6.0, 6.0, 1.0, 4.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.776268005371094, -19.633508682250977, -18.490751266479492, -17.347991943359375, -16.205232620239258, -15.062474250793457, -13.919715881347656, -12.776956558227539, -11.634198188781738, -10.491439819335938, -9.34868049621582, -8.20592212677002, -7.0631632804870605, -5.920404434204102, -4.777646064758301, -3.634887218475342, -2.492128372192383, -1.3493696451187134, -0.20661091804504395, 0.9361476898193359, 2.078906536102295, 3.221665382385254, 4.364423751831055, 5.507182598114014, 6.649941444396973, 7.792700290679932, 8.93545913696289, 10.078217506408691, 11.220975875854492, 12.36373519897461, 13.50649356842041, 14.649251937866211, 15.792011260986328, 16.934770584106445, 18.07752799987793, 19.220287322998047, 20.363046646118164, 21.50580596923828, 22.648563385009766, 23.791322708129883, 24.93408203125, 26.076841354370117, 27.2195987701416, 28.36235809326172, 29.505117416381836, 30.647876739501953, 31.790634155273438, 32.93339157104492, 34.076148986816406, 35.21890640258789, 36.36166763305664, 37.504425048828125, 38.64718246459961, 39.78994369506836, 40.932701110839844, 42.07545852661133, 43.21821975708008, 44.36097717285156, 45.50373840332031, 46.6464958190918, 47.78925323486328, 48.93201446533203, 50.074771881103516, 51.217529296875, 52.36029052734375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 6.0, 0.0, 4.0, 12.0, 7.0, 13.0, 13.0, 21.0, 17.0, 28.0, 33.0, 45.0, 55.0, 54.0, 73.0, 80.0, 86.0, 78.0, 56.0, 68.0, 54.0, 36.0, 33.0, 32.0, 31.0, 21.0, 11.0, 11.0, 4.0, 6.0, 2.0, 4.0, 4.0, 7.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.300798416137695, -22.695552825927734, -22.09030532836914, -21.48505973815918, -20.879812240600586, -20.274566650390625, -19.66931915283203, -19.06407356262207, -18.458826065063477, -17.853580474853516, -17.248332977294922, -16.64308738708496, -16.037839889526367, -15.43259334564209, -14.827346801757812, -14.222101211547852, -13.616854667663574, -13.011608123779297, -12.40636157989502, -11.801115036010742, -11.195868492126465, -10.590621948242188, -9.985376358032227, -9.380128860473633, -8.774883270263672, -8.169636726379395, -7.564390182495117, -6.95914363861084, -6.3538970947265625, -5.748650550842285, -5.143404483795166, -4.538157939910889, -3.9329118728637695, -3.327665328979492, -2.722418785095215, -2.1171724796295166, -1.5119259357452393, -0.9066793918609619, -0.30143308639526367, 0.30381345748901367, 0.909060001373291, 1.5143065452575684, 2.1195530891418457, 2.724799394607544, 3.3300459384918213, 3.9352924823760986, 4.540538787841797, 5.145785331726074, 5.751031875610352, 6.356278419494629, 6.961524963378906, 7.566771507263184, 8.172018051147461, 8.777264595031738, 9.382511138916016, 9.987756729125977, 10.59300422668457, 11.198250770568848, 11.803497314453125, 12.408743858337402, 13.01399040222168, 13.619236946105957, 14.224483489990234, 14.829729080200195, 15.434975624084473]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 8.0, 5.0, 7.0, 18.0, 18.0, 29.0, 48.0, 83.0, 181.0, 255.0, 571.0, 1209.0, 3128.0, 9243.0, 38794.0, 311268.0, 603262.0, 60513.0, 12992.0, 3937.0, 1536.0, 670.0, 348.0, 191.0, 88.0, 63.0, 43.0, 15.0, 11.0, 11.0, 8.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.298828125, -1.249114990234375, -1.19940185546875, -1.149688720703125, -1.0999755859375, -1.050262451171875, -1.00054931640625, -0.950836181640625, -0.901123046875, -0.851409912109375, -0.80169677734375, -0.751983642578125, -0.7022705078125, -0.652557373046875, -0.60284423828125, -0.553131103515625, -0.50341796875, -0.453704833984375, -0.40399169921875, -0.354278564453125, -0.3045654296875, -0.254852294921875, -0.20513916015625, -0.155426025390625, -0.105712890625, -0.055999755859375, -0.00628662109375, 0.043426513671875, 0.0931396484375, 0.142852783203125, 0.19256591796875, 0.242279052734375, 0.2919921875, 0.341705322265625, 0.39141845703125, 0.441131591796875, 0.4908447265625, 0.540557861328125, 0.59027099609375, 0.639984130859375, 0.689697265625, 0.739410400390625, 0.78912353515625, 0.838836669921875, 0.8885498046875, 0.938262939453125, 0.98797607421875, 1.037689208984375, 1.08740234375, 1.137115478515625, 1.18682861328125, 1.236541748046875, 1.2862548828125, 1.335968017578125, 1.38568115234375, 1.435394287109375, 1.485107421875, 1.534820556640625, 1.58453369140625, 1.634246826171875, 1.6839599609375, 1.733673095703125, 1.78338623046875, 1.833099365234375, 1.8828125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 5.0, 4.0, 4.0, 7.0, 4.0, 12.0, 12.0, 19.0, 16.0, 16.0, 21.0, 28.0, 32.0, 33.0, 39.0, 45.0, 37.0, 49.0, 50.0, 60.0, 59.0, 41.0, 54.0, 47.0, 52.0, 40.0, 55.0, 36.0, 21.0, 31.0, 13.0, 13.0, 15.0, 5.0, 12.0, 6.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92626953125, -0.8953781127929688, -0.8644866943359375, -0.8335952758789062, -0.802703857421875, -0.7718124389648438, -0.7409210205078125, -0.7100296020507812, -0.67913818359375, -0.6482467651367188, -0.6173553466796875, -0.5864639282226562, -0.555572509765625, -0.5246810913085938, -0.4937896728515625, -0.46289825439453125, -0.4320068359375, -0.40111541748046875, -0.3702239990234375, -0.33933258056640625, -0.308441162109375, -0.27754974365234375, -0.2466583251953125, -0.21576690673828125, -0.18487548828125, -0.15398406982421875, -0.1230926513671875, -0.09220123291015625, -0.061309814453125, -0.03041839599609375, 0.0004730224609375, 0.03136444091796875, 0.062255859375, 0.09314727783203125, 0.1240386962890625, 0.15493011474609375, 0.185821533203125, 0.21671295166015625, 0.2476043701171875, 0.27849578857421875, 0.30938720703125, 0.34027862548828125, 0.3711700439453125, 0.40206146240234375, 0.432952880859375, 0.46384429931640625, 0.4947357177734375, 0.5256271362304688, 0.5565185546875, 0.5874099731445312, 0.6183013916015625, 0.6491928100585938, 0.680084228515625, 0.7109756469726562, 0.7418670654296875, 0.7727584838867188, 0.80364990234375, 0.8345413208007812, 0.8654327392578125, 0.8963241577148438, 0.927215576171875, 0.9581069946289062, 0.9889984130859375, 1.0198898315429688, 1.05078125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 7.0, 5.0, 11.0, 7.0, 15.0, 16.0, 22.0, 26.0, 37.0, 64.0, 85.0, 114.0, 207.0, 395.0, 795.0, 2245.0, 11086.0, 142636.0, 860704.0, 23911.0, 3766.0, 1161.0, 503.0, 255.0, 139.0, 95.0, 69.0, 60.0, 35.0, 14.0, 14.0, 19.0, 9.0, 6.0, 6.0, 6.0, 5.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8212890625, -1.76287841796875, -1.7044677734375, -1.64605712890625, -1.587646484375, -1.52923583984375, -1.4708251953125, -1.41241455078125, -1.35400390625, -1.29559326171875, -1.2371826171875, -1.17877197265625, -1.120361328125, -1.06195068359375, -1.0035400390625, -0.94512939453125, -0.88671875, -0.82830810546875, -0.7698974609375, -0.71148681640625, -0.653076171875, -0.59466552734375, -0.5362548828125, -0.47784423828125, -0.41943359375, -0.36102294921875, -0.3026123046875, -0.24420166015625, -0.185791015625, -0.12738037109375, -0.0689697265625, -0.01055908203125, 0.0478515625, 0.10626220703125, 0.1646728515625, 0.22308349609375, 0.281494140625, 0.33990478515625, 0.3983154296875, 0.45672607421875, 0.51513671875, 0.57354736328125, 0.6319580078125, 0.69036865234375, 0.748779296875, 0.80718994140625, 0.8656005859375, 0.92401123046875, 0.982421875, 1.04083251953125, 1.0992431640625, 1.15765380859375, 1.216064453125, 1.27447509765625, 1.3328857421875, 1.39129638671875, 1.44970703125, 1.50811767578125, 1.5665283203125, 1.62493896484375, 1.683349609375, 1.74176025390625, 1.8001708984375, 1.85858154296875, 1.9169921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 1.0, 5.0, 5.0, 1.0, 11.0, 5.0, 7.0, 16.0, 9.0, 17.0, 20.0, 14.0, 29.0, 31.0, 34.0, 25.0, 37.0, 54.0, 51.0, 64.0, 74.0, 59.0, 66.0, 50.0, 39.0, 34.0, 41.0, 26.0, 22.0, 30.0, 22.0, 12.0, 15.0, 14.0, 10.0, 7.0, 7.0, 1.0, 4.0, 5.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.048828125, -2.95843505859375, -2.8680419921875, -2.77764892578125, -2.687255859375, -2.59686279296875, -2.5064697265625, -2.41607666015625, -2.32568359375, -2.23529052734375, -2.1448974609375, -2.05450439453125, -1.964111328125, -1.87371826171875, -1.7833251953125, -1.69293212890625, -1.6025390625, -1.51214599609375, -1.4217529296875, -1.33135986328125, -1.240966796875, -1.15057373046875, -1.0601806640625, -0.96978759765625, -0.87939453125, -0.78900146484375, -0.6986083984375, -0.60821533203125, -0.517822265625, -0.42742919921875, -0.3370361328125, -0.24664306640625, -0.15625, -0.06585693359375, 0.0245361328125, 0.11492919921875, 0.205322265625, 0.29571533203125, 0.3861083984375, 0.47650146484375, 0.56689453125, 0.65728759765625, 0.7476806640625, 0.83807373046875, 0.928466796875, 1.01885986328125, 1.1092529296875, 1.19964599609375, 1.2900390625, 1.38043212890625, 1.4708251953125, 1.56121826171875, 1.651611328125, 1.74200439453125, 1.8323974609375, 1.92279052734375, 2.01318359375, 2.10357666015625, 2.1939697265625, 2.28436279296875, 2.374755859375, 2.46514892578125, 2.5555419921875, 2.64593505859375, 2.736328125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 7.0, 12.0, 10.0, 11.0, 25.0, 35.0, 47.0, 88.0, 135.0, 290.0, 573.0, 1511.0, 4477.0, 21951.0, 793209.0, 203291.0, 16672.0, 3866.0, 1207.0, 497.0, 274.0, 128.0, 72.0, 47.0, 40.0, 20.0, 17.0, 8.0, 6.0, 8.0, 3.0, 6.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36083984375, -0.3487815856933594, -0.33672332763671875, -0.3246650695800781, -0.3126068115234375, -0.3005485534667969, -0.28849029541015625, -0.2764320373535156, -0.264373779296875, -0.2523155212402344, -0.24025726318359375, -0.22819900512695312, -0.2161407470703125, -0.20408248901367188, -0.19202423095703125, -0.17996597290039062, -0.16790771484375, -0.15584945678710938, -0.14379119873046875, -0.13173294067382812, -0.1196746826171875, -0.10761642456054688, -0.09555816650390625, -0.08349990844726562, -0.071441650390625, -0.059383392333984375, -0.04732513427734375, -0.035266876220703125, -0.0232086181640625, -0.011150360107421875, 0.00090789794921875, 0.012966156005859375, 0.0250244140625, 0.037082672119140625, 0.04914093017578125, 0.061199188232421875, 0.0732574462890625, 0.08531570434570312, 0.09737396240234375, 0.10943222045898438, 0.121490478515625, 0.13354873657226562, 0.14560699462890625, 0.15766525268554688, 0.1697235107421875, 0.18178176879882812, 0.19384002685546875, 0.20589828491210938, 0.21795654296875, 0.23001480102539062, 0.24207305908203125, 0.2541313171386719, 0.2661895751953125, 0.2782478332519531, 0.29030609130859375, 0.3023643493652344, 0.314422607421875, 0.3264808654785156, 0.33853912353515625, 0.3505973815917969, 0.3626556396484375, 0.3747138977050781, 0.38677215576171875, 0.3988304138183594, 0.410888671875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 3.0, 5.0, 10.0, 4.0, 8.0, 9.0, 11.0, 19.0, 18.0, 35.0, 47.0, 85.0, 114.0, 143.0, 141.0, 105.0, 65.0, 39.0, 28.0, 28.0, 20.0, 6.0, 8.0, 9.0, 6.0, 8.0, 3.0, 7.0, 2.0, 4.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.936094284057617e-05, -9.642355144023895e-05, -9.348616003990173e-05, -9.054876863956451e-05, -8.76113772392273e-05, -8.467398583889008e-05, -8.173659443855286e-05, -7.879920303821564e-05, -7.586181163787842e-05, -7.29244202375412e-05, -6.998702883720398e-05, -6.704963743686676e-05, -6.411224603652954e-05, -6.117485463619232e-05, -5.82374632358551e-05, -5.530007183551788e-05, -5.2362680435180664e-05, -4.9425289034843445e-05, -4.6487897634506226e-05, -4.3550506234169006e-05, -4.061311483383179e-05, -3.767572343349457e-05, -3.473833203315735e-05, -3.180094063282013e-05, -2.886354923248291e-05, -2.592615783214569e-05, -2.298876643180847e-05, -2.0051375031471252e-05, -1.7113983631134033e-05, -1.4176592230796814e-05, -1.1239200830459595e-05, -8.301809430122375e-06, -5.364418029785156e-06, -2.427026629447937e-06, 5.103647708892822e-07, 3.4477561712265015e-06, 6.385147571563721e-06, 9.32253897190094e-06, 1.225993037223816e-05, 1.5197321772575378e-05, 1.8134713172912598e-05, 2.1072104573249817e-05, 2.4009495973587036e-05, 2.6946887373924255e-05, 2.9884278774261475e-05, 3.2821670174598694e-05, 3.575906157493591e-05, 3.869645297527313e-05, 4.163384437561035e-05, 4.457123577594757e-05, 4.750862717628479e-05, 5.044601857662201e-05, 5.338340997695923e-05, 5.632080137729645e-05, 5.925819277763367e-05, 6.219558417797089e-05, 6.51329755783081e-05, 6.807036697864532e-05, 7.100775837898254e-05, 7.394514977931976e-05, 7.688254117965698e-05, 7.98199325799942e-05, 8.275732398033142e-05, 8.569471538066864e-05, 8.863210678100586e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 6.0, 8.0, 11.0, 18.0, 18.0, 24.0, 33.0, 42.0, 84.0, 133.0, 192.0, 359.0, 607.0, 1088.0, 2296.0, 4902.0, 11745.0, 35043.0, 289425.0, 642799.0, 37100.0, 12505.0, 5054.0, 2313.0, 1139.0, 615.0, 375.0, 202.0, 128.0, 90.0, 55.0, 47.0, 28.0, 14.0, 16.0, 13.0, 6.0, 7.0, 7.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2454833984375, -0.23756980895996094, -0.22965621948242188, -0.2217426300048828, -0.21382904052734375, -0.2059154510498047, -0.19800186157226562, -0.19008827209472656, -0.1821746826171875, -0.17426109313964844, -0.16634750366210938, -0.1584339141845703, -0.15052032470703125, -0.1426067352294922, -0.13469314575195312, -0.12677955627441406, -0.118865966796875, -0.11095237731933594, -0.10303878784179688, -0.09512519836425781, -0.08721160888671875, -0.07929801940917969, -0.07138442993164062, -0.06347084045410156, -0.0555572509765625, -0.04764366149902344, -0.039730072021484375, -0.03181648254394531, -0.02390289306640625, -0.015989303588867188, -0.008075714111328125, -0.0001621246337890625, 0.00775146484375, 0.015665054321289062, 0.023578643798828125, 0.03149223327636719, 0.03940582275390625, 0.04731941223144531, 0.055233001708984375, 0.06314659118652344, 0.0710601806640625, 0.07897377014160156, 0.08688735961914062, 0.09480094909667969, 0.10271453857421875, 0.11062812805175781, 0.11854171752929688, 0.12645530700683594, 0.134368896484375, 0.14228248596191406, 0.15019607543945312, 0.1581096649169922, 0.16602325439453125, 0.1739368438720703, 0.18185043334960938, 0.18976402282714844, 0.1976776123046875, 0.20559120178222656, 0.21350479125976562, 0.2214183807373047, 0.22933197021484375, 0.2372455596923828, 0.24515914916992188, 0.25307273864746094, 0.260986328125]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 4.0, 0.0, 4.0, 4.0, 2.0, 9.0, 10.0, 17.0, 14.0, 31.0, 27.0, 40.0, 62.0, 91.0, 116.0, 132.0, 117.0, 85.0, 58.0, 46.0, 27.0, 23.0, 14.0, 12.0, 14.0, 10.0, 4.0, 2.0, 6.0, 3.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.31591796875, -0.30438995361328125, -0.2928619384765625, -0.28133392333984375, -0.269805908203125, -0.25827789306640625, -0.2467498779296875, -0.23522186279296875, -0.22369384765625, -0.21216583251953125, -0.2006378173828125, -0.18910980224609375, -0.177581787109375, -0.16605377197265625, -0.1545257568359375, -0.14299774169921875, -0.1314697265625, -0.11994171142578125, -0.1084136962890625, -0.09688568115234375, -0.085357666015625, -0.07382965087890625, -0.0623016357421875, -0.05077362060546875, -0.03924560546875, -0.02771759033203125, -0.0161895751953125, -0.00466156005859375, 0.006866455078125, 0.01839447021484375, 0.0299224853515625, 0.04145050048828125, 0.052978515625, 0.06450653076171875, 0.0760345458984375, 0.08756256103515625, 0.099090576171875, 0.11061859130859375, 0.1221466064453125, 0.13367462158203125, 0.14520263671875, 0.15673065185546875, 0.1682586669921875, 0.17978668212890625, 0.191314697265625, 0.20284271240234375, 0.2143707275390625, 0.22589874267578125, 0.2374267578125, 0.24895477294921875, 0.2604827880859375, 0.27201080322265625, 0.283538818359375, 0.29506683349609375, 0.3065948486328125, 0.31812286376953125, 0.32965087890625, 0.34117889404296875, 0.3527069091796875, 0.36423492431640625, 0.375762939453125, 0.38729095458984375, 0.3988189697265625, 0.41034698486328125, 0.421875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 2.0, 6.0, 16.0, 35.0, 69.0, 249.0, 426.0, 91.0, 54.0, 20.0, 14.0, 9.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.628650665283203, -19.100866317749023, -18.573083877563477, -18.045299530029297, -17.517515182495117, -16.989730834960938, -16.46194839477539, -15.934164047241211, -15.406380653381348, -14.878597259521484, -14.350812911987305, -13.823029518127441, -13.295246124267578, -12.767461776733398, -12.239678382873535, -11.711894989013672, -11.184110641479492, -10.656327247619629, -10.12854290008545, -9.600759506225586, -9.072975158691406, -8.545191764831543, -8.01740837097168, -7.489624500274658, -6.961840629577637, -6.434056758880615, -5.906272888183594, -5.3784894943237305, -4.850705623626709, -4.3229217529296875, -3.795138120651245, -3.2673544883728027, -2.7395687103271484, -2.211784839630127, -1.6840012073516846, -1.1562174558639526, -0.6284337043762207, -0.10064983367919922, 0.42713379859924316, 0.9549174308776855, 1.482701301574707, 2.0104851722717285, 2.538268804550171, 3.0660524368286133, 3.5938363075256348, 4.121620178222656, 4.6494035720825195, 5.177187442779541, 5.7049713134765625, 6.232755184173584, 6.7605390548706055, 7.288322448730469, 7.81610631942749, 8.343890190124512, 8.871673583984375, 9.399457931518555, 9.927241325378418, 10.455024719238281, 10.982809066772461, 11.510592460632324, 12.038375854492188, 12.566160202026367, 13.09394359588623, 13.621726989746094, 14.149511337280273]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 6.0, 6.0, 4.0, 8.0, 14.0, 6.0, 14.0, 9.0, 10.0, 10.0, 13.0, 21.0, 25.0, 16.0, 23.0, 59.0, 133.0, 125.0, 123.0, 122.0, 38.0, 24.0, 31.0, 21.0, 20.0, 21.0, 14.0, 10.0, 9.0, 11.0, 11.0, 4.0, 11.0, 6.0, 4.0, 8.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.117767333984375, -8.831701278686523, -8.545635223388672, -8.25956916809082, -7.973503589630127, -7.687437534332275, -7.401371479034424, -7.1153059005737305, -6.829239845275879, -6.543173789978027, -6.257107734680176, -5.971041679382324, -5.684976100921631, -5.398910045623779, -5.112843990325928, -4.826778411865234, -4.540711879730225, -4.254645824432373, -3.9685800075531006, -3.682513952255249, -3.3964481353759766, -3.110382080078125, -2.8243160247802734, -2.538250207901001, -2.2521841526031494, -1.9661182165145874, -1.6800522804260254, -1.3939862251281738, -1.1079202890396118, -0.8218543529510498, -0.5357882976531982, -0.24972248077392578, 0.03634357452392578, 0.3224095404148102, 0.6084755063056946, 0.8945415019989014, 1.1806074380874634, 1.4666733741760254, 1.752739429473877, 2.0388052463531494, 2.324871301651001, 2.6109373569488525, 2.897003173828125, 3.1830692291259766, 3.469135284423828, 3.7552011013031006, 4.041267395019531, 4.327332973480225, 4.613399028778076, 4.899465084075928, 5.185531139373779, 5.471596717834473, 5.757662773132324, 6.043728828430176, 6.329794883728027, 6.615860939025879, 6.9019269943237305, 7.187993049621582, 7.474059104919434, 7.760125160217285, 8.046191215515137, 8.332256317138672, 8.618322372436523, 8.904388427734375, 9.190454483032227]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 7.0, 4.0, 7.0, 9.0, 6.0, 14.0, 9.0, 16.0, 17.0, 19.0, 32.0, 32.0, 33.0, 38.0, 43.0, 105.0, 224.0, 86.0, 34.0, 35.0, 38.0, 40.0, 28.0, 20.0, 22.0, 16.0, 10.0, 16.0, 6.0, 8.0, 5.0, 4.0, 3.0, 3.0, 7.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80712890625, -0.7777786254882812, -0.7484283447265625, -0.7190780639648438, -0.689727783203125, -0.6603775024414062, -0.6310272216796875, -0.6016769409179688, -0.57232666015625, -0.5429763793945312, -0.5136260986328125, -0.48427581787109375, -0.454925537109375, -0.42557525634765625, -0.3962249755859375, -0.36687469482421875, -0.3375244140625, -0.30817413330078125, -0.2788238525390625, -0.24947357177734375, -0.220123291015625, -0.19077301025390625, -0.1614227294921875, -0.13207244873046875, -0.10272216796875, -0.07337188720703125, -0.0440216064453125, -0.01467132568359375, 0.014678955078125, 0.04402923583984375, 0.0733795166015625, 0.10272979736328125, 0.132080078125, 0.16143035888671875, 0.1907806396484375, 0.22013092041015625, 0.249481201171875, 0.27883148193359375, 0.3081817626953125, 0.33753204345703125, 0.36688232421875, 0.39623260498046875, 0.4255828857421875, 0.45493316650390625, 0.484283447265625, 0.5136337280273438, 0.5429840087890625, 0.5723342895507812, 0.6016845703125, 0.6310348510742188, 0.6603851318359375, 0.6897354125976562, 0.719085693359375, 0.7484359741210938, 0.7777862548828125, 0.8071365356445312, 0.83648681640625, 0.8658370971679688, 0.8951873779296875, 0.9245376586914062, 0.953887939453125, 0.9832382202148438, 1.0125885009765625, 1.0419387817382812, 1.0712890625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 3.0, 9.0, 3.0, 20.0, 26.0, 27.0, 57.0, 95.0, 238.0, 827.0, 3768.0, 7826143.0, 552734.0, 3492.0, 709.0, 229.0, 84.0, 50.0, 30.0, 14.0, 7.0, 3.0, 6.0, 3.0, 3.0, 6.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.961023330688477, -11.628612518310547, -11.2962007522583, -10.963789939880371, -10.631378173828125, -10.298967361450195, -9.96655559539795, -9.63414478302002, -9.301733016967773, -8.969322204589844, -8.636910438537598, -8.304499626159668, -7.972087860107422, -7.639677047729492, -7.307265758514404, -6.974854469299316, -6.642443656921387, -6.310032367706299, -5.977621078491211, -5.645209789276123, -5.312798500061035, -4.9803876876831055, -4.647976398468018, -4.31556510925293, -3.983153820037842, -3.650742530822754, -3.318331241607666, -2.9859201908111572, -2.6535089015960693, -2.3210976123809814, -1.988686442375183, -1.6562752723693848, -1.3238630294799805, -0.9914517998695374, -0.6590405702590942, -0.3266293406486511, 0.005781888961791992, 0.3381931781768799, 0.6706043481826782, 1.0030155181884766, 1.3354268074035645, 1.6678380966186523, 2.0002493858337402, 2.332660436630249, 2.665071725845337, 2.997483015060425, 3.3298940658569336, 3.6623053550720215, 3.9947166442871094, 4.327127933502197, 4.659539222717285, 4.991950511932373, 5.324361801147461, 5.656772613525391, 5.9891839027404785, 6.321595191955566, 6.654006481170654, 6.986417770385742, 7.31882905960083, 7.651240348815918, 7.983651161193848, 8.316062927246094, 8.648473739624023, 8.980884552001953, 9.3132963180542]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 2.0, 3.0, 4.0, 1.0, 3.0, 4.0, 5.0, 5.0, 7.0, 6.0, 7.0, 5.0, 2.0, 1.0, 3.0, 5.0, 2.0, 3.0, 3.0, 0.0, 1.0], "bins": [-18.021726608276367, -17.648488998413086, -17.275251388549805, -16.902015686035156, -16.528778076171875, -16.155540466308594, -15.782302856445312, -15.409066200256348, -15.035829544067383, -14.662591934204102, -14.289355278015137, -13.916117668151855, -13.54288101196289, -13.16964340209961, -12.796405792236328, -12.423169136047363, -12.049931526184082, -11.6766939163208, -11.303457260131836, -10.930219650268555, -10.55698299407959, -10.183745384216309, -9.810508728027344, -9.437271118164062, -9.064033508300781, -8.6907958984375, -8.317559242248535, -7.944321632385254, -7.571084976196289, -7.197847366333008, -6.824610233306885, -6.451373100280762, -6.078135967254639, -5.704898834228516, -5.331661701202393, -4.9584245681762695, -4.585186958312988, -4.211950302124023, -3.838712692260742, -3.465475559234619, -3.092238426208496, -2.719001293182373, -2.34576416015625, -1.9725267887115479, -1.5992896556854248, -1.2260525226593018, -0.8528151512145996, -0.47957801818847656, -0.10634088516235352, 0.2668963074684143, 0.6401335000991821, 1.0133707523345947, 1.3866078853607178, 1.7598450183868408, 2.133082389831543, 2.506319522857666, 2.879556655883789, 3.252793788909912, 3.626030921936035, 3.9992682933807373, 4.372505187988281, 4.7457427978515625, 5.1189799308776855, 5.492217063903809, 5.865454196929932]}, "gradients/encoder.masked_spec_embed": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 7.0, 10.0, 8.0, 6.0, 20.0, 20.0, 21.0, 33.0, 26.0, 44.0, 30.0, 34.0, 37.0, 48.0, 47.0, 54.0, 43.0, 50.0, 65.0, 50.0, 50.0, 42.0, 40.0, 34.0, 38.0, 25.0, 22.0, 17.0, 19.0, 10.0, 10.0, 12.0, 10.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.282470703125, -0.27215576171875, -0.2618408203125, -0.25152587890625, -0.2412109375, -0.23089599609375, -0.2205810546875, -0.21026611328125, -0.199951171875, -0.18963623046875, -0.1793212890625, -0.16900634765625, -0.15869140625, -0.14837646484375, -0.1380615234375, -0.12774658203125, -0.117431640625, -0.10711669921875, -0.0968017578125, -0.08648681640625, -0.076171875, -0.06585693359375, -0.0555419921875, -0.04522705078125, -0.034912109375, -0.02459716796875, -0.0142822265625, -0.00396728515625, 0.00634765625, 0.01666259765625, 0.0269775390625, 0.03729248046875, 0.047607421875, 0.05792236328125, 0.0682373046875, 0.07855224609375, 0.0888671875, 0.09918212890625, 0.1094970703125, 0.11981201171875, 0.130126953125, 0.14044189453125, 0.1507568359375, 0.16107177734375, 0.17138671875, 0.18170166015625, 0.1920166015625, 0.20233154296875, 0.212646484375, 0.22296142578125, 0.2332763671875, 0.24359130859375, 0.25390625, 0.26422119140625, 0.2745361328125, 0.28485107421875, 0.295166015625, 0.30548095703125, 0.3157958984375, 0.32611083984375, 0.33642578125, 0.34674072265625, 0.3570556640625, 0.36737060546875, 0.377685546875]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 8.0, 7.0, 20.0, 22.0, 36.0, 42.0, 95.0, 193.0, 370.0, 791.0, 2171.0, 7237.0, 32454.0, 168543.0, 243089.0, 53564.0, 11159.0, 2804.0, 919.0, 336.0, 171.0, 77.0, 55.0, 28.0, 21.0, 17.0, 7.0, 6.0, 9.0, 7.0, 8.0, 3.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.625, -6.361572265625, -6.09814453125, -5.834716796875, -5.5712890625, -5.307861328125, -5.04443359375, -4.781005859375, -4.517578125, -4.254150390625, -3.99072265625, -3.727294921875, -3.4638671875, -3.200439453125, -2.93701171875, -2.673583984375, -2.41015625, -2.146728515625, -1.88330078125, -1.619873046875, -1.3564453125, -1.093017578125, -0.82958984375, -0.566162109375, -0.302734375, -0.039306640625, 0.22412109375, 0.487548828125, 0.7509765625, 1.014404296875, 1.27783203125, 1.541259765625, 1.8046875, 2.068115234375, 2.33154296875, 2.594970703125, 2.8583984375, 3.121826171875, 3.38525390625, 3.648681640625, 3.912109375, 4.175537109375, 4.43896484375, 4.702392578125, 4.9658203125, 5.229248046875, 5.49267578125, 5.756103515625, 6.01953125, 6.282958984375, 6.54638671875, 6.809814453125, 7.0732421875, 7.336669921875, 7.60009765625, 7.863525390625, 8.126953125, 8.390380859375, 8.65380859375, 8.917236328125, 9.1806640625, 9.444091796875, 9.70751953125, 9.970947265625, 10.234375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 7.0, 5.0, 6.0, 14.0, 18.0, 12.0, 13.0, 22.0, 21.0, 22.0, 38.0, 34.0, 37.0, 49.0, 36.0, 45.0, 65.0, 53.0, 66.0, 58.0, 35.0, 57.0, 44.0, 35.0, 33.0, 35.0, 30.0, 23.0, 10.0, 18.0, 17.0, 7.0, 8.0, 8.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.87646484375, -0.850372314453125, -0.82427978515625, -0.798187255859375, -0.7720947265625, -0.746002197265625, -0.71990966796875, -0.693817138671875, -0.667724609375, -0.641632080078125, -0.61553955078125, -0.589447021484375, -0.5633544921875, -0.537261962890625, -0.51116943359375, -0.485076904296875, -0.458984375, -0.432891845703125, -0.40679931640625, -0.380706787109375, -0.3546142578125, -0.328521728515625, -0.30242919921875, -0.276336669921875, -0.250244140625, -0.224151611328125, -0.19805908203125, -0.171966552734375, -0.1458740234375, -0.119781494140625, -0.09368896484375, -0.067596435546875, -0.04150390625, -0.015411376953125, 0.01068115234375, 0.036773681640625, 0.0628662109375, 0.088958740234375, 0.11505126953125, 0.141143798828125, 0.167236328125, 0.193328857421875, 0.21942138671875, 0.245513916015625, 0.2716064453125, 0.297698974609375, 0.32379150390625, 0.349884033203125, 0.3759765625, 0.402069091796875, 0.42816162109375, 0.454254150390625, 0.4803466796875, 0.506439208984375, 0.53253173828125, 0.558624267578125, 0.584716796875, 0.610809326171875, 0.63690185546875, 0.662994384765625, 0.6890869140625, 0.715179443359375, 0.74127197265625, 0.767364501953125, 0.79345703125]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 4.0, 8.0, 15.0, 32.0, 60.0, 85.0, 125.0, 81.0, 37.0, 18.0, 12.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.675508499145508, -8.344514846801758, -8.013520240783691, -7.682526588439941, -7.351532459259033, -7.020538330078125, -6.689544677734375, -6.358550548553467, -6.027556419372559, -5.69656229019165, -5.3655686378479, -5.034574508666992, -4.703580379486084, -4.372586250305176, -4.041592597961426, -3.7105984687805176, -3.3796048164367676, -3.0486109256744385, -2.7176167964935303, -2.386622905731201, -2.055628776550293, -1.7246348857879639, -1.3936409950256348, -1.0626468658447266, -0.7316529750823975, -0.4006589949131012, -0.06966501474380493, 0.26132893562316895, 0.5923229455947876, 0.9233169555664062, 1.2543108463287354, 1.5853049755096436, 1.9162988662719727, 2.2472927570343018, 2.57828688621521, 2.909280776977539, 3.2402749061584473, 3.5712687969207764, 3.9022626876831055, 4.233256816864014, 4.564250946044922, 4.89524507522583, 5.22623872756958, 5.557232856750488, 5.8882269859313965, 6.219221115112305, 6.550214767456055, 6.881208896636963, 7.212202548980713, 7.543196678161621, 7.874190330505371, 8.205184936523438, 8.536178588867188, 8.867172241210938, 9.198165893554688, 9.529160499572754, 9.860154151916504, 10.191147804260254, 10.52214241027832, 10.85313606262207, 11.18412971496582, 11.515124320983887, 11.846117973327637, 12.177112579345703, 12.508106231689453]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 1.0, 5.0, 4.0, 3.0, 8.0, 15.0, 19.0, 61.0, 76.0, 120.0, 81.0, 30.0, 15.0, 7.0, 3.0, 7.0, 5.0, 7.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.476879596710205, -5.25417423248291, -5.031468391418457, -4.808763027191162, -4.586057662963867, -4.363351821899414, -4.140646457672119, -3.917940855026245, -3.695235252380371, -3.472529649734497, -3.249824047088623, -3.027118682861328, -2.804413080215454, -2.58170747756958, -2.359002113342285, -2.136296510696411, -1.913590908050537, -1.690885305404663, -1.4681798219680786, -1.2454743385314941, -1.0227687358856201, -0.8000631332397461, -0.5773576498031616, -0.35465216636657715, -0.13194656372070312, 0.09075897932052612, 0.31346452236175537, 0.5361700654029846, 0.7588756084442139, 0.9815812110900879, 1.2042866945266724, 1.4269921779632568, 1.6496973037719727, 1.8724029064178467, 2.0951085090637207, 2.3178138732910156, 2.5405194759368896, 2.7632250785827637, 2.9859304428100586, 3.2086360454559326, 3.4313416481018066, 3.6540472507476807, 3.8767528533935547, 4.09945821762085, 4.3221635818481445, 4.544869422912598, 4.767574787139893, 4.9902801513671875, 5.212985992431641, 5.4356913566589355, 5.658397197723389, 5.881102561950684, 6.103808403015137, 6.326513767242432, 6.549219131469727, 6.77192497253418, 6.994630336761475, 7.2173357009887695, 7.440041542053223, 7.662746906280518, 7.8854522705078125, 8.108158111572266, 8.330863952636719, 8.553568840026855, 8.776274681091309]}, "eval/loss": 3.9967808723449707, "eval/wer": 1.6151527171757238, "eval/runtime": 586.6262, "eval/samples_per_second": 4.504, "eval/steps_per_second": 0.564} \ No newline at end of file